Packages and utilities

library(tidyverse)
Registered S3 methods overwritten by 'dbplyr':
  method         from
  print.tbl_lazy     
  print.tbl_sql      
── Attaching packages ───────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────── tidyverse 1.3.0 ──
✓ ggplot2 3.2.1     ✓ purrr   0.3.3
✓ tibble  2.1.3     ✓ dplyr   0.8.4
✓ tidyr   1.0.2     ✓ stringr 1.4.0
✓ readr   1.3.1     ✓ forcats 0.4.0
── Conflicts ──────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────── tidyverse_conflicts() ──
x dplyr::filter() masks stats::filter()
x dplyr::lag()    masks stats::lag()
library(lme4)
Loading required package: Matrix

Attaching package: ‘Matrix’

The following objects are masked from ‘package:tidyr’:

    expand, pack, unpack
library(lmerTest)

Attaching package: ‘lmerTest’

The following object is masked from ‘package:lme4’:

    lmer

The following object is masked from ‘package:stats’:

    step
library(plotrix)
library(stringr)
library(readxl)
library(RColorBrewer)
library(mvtnorm)
library(mgcv)
Loading required package: nlme

Attaching package: ‘nlme’

The following object is masked from ‘package:lme4’:

    lmList

The following object is masked from ‘package:dplyr’:

    collapse

This is mgcv 1.8-31. For overview type 'help("mgcv-package")'.
# Total log-likelihood of held-out observations under a fitted model.
#
# Arguments:
#   lm     - fitted model object accepted by predict() and sigma()
#   test_X - data frame with the predictor columns for the held-out rows
#   test_y - observed responses, aligned with the rows of test_X
#
# Returns a single number: the sum over observations of
# log N(test_y | predicted mean, residual s.d. estimated on the training data).
# `re.form = NA` is forwarded to predict() unchanged.
logLik_test <- function(lm, test_X, test_y) {
  predicted_mean <- predict(lm, test_X, re.form = NA)
  residual_sd <- sigma(lm)
  pointwise_log_density <- dnorm(
    test_y,
    mean = predicted_mean,
    sd = residual_sd,
    log = TRUE
  )
  sum(pointwise_log_density)
}
# Per-observation log-likelihood of held-out data under a fitted model.
#
# Same inputs as logLik_test(), but the log densities are returned one per
# observation (a numeric vector as long as test_y) instead of being summed.
logLik_test_per <- function(lm, test_X, test_y) {
  # Residual s.d. comes from the fitted model, i.e. from the training data.
  residual_sd <- sigma(lm)
  predicted_mean <- predict(lm, test_X, re.form = NA)
  dnorm(test_y, mean = predicted_mean, sd = residual_sd, log = TRUE)
}
# Mean squared error of a fitted model's predictions on held-out data.
#
# Arguments mirror logLik_test(): a fitted model, the held-out predictors and
# the matching observed responses. Returns a single number.
mse_test <- function(lm, test_X, test_y) {
  prediction_error <- predict(lm, test_X, re.form = NA) - test_y
  mean(prediction_error^2)
}
#Sanity checks
#mylm <- gam(psychometric ~  s(surprisal, bs = "cr", k = 20) + s(prev_surp, bs = "cr", k = 20) + te(freq, len, bs = "cr") + te(prev_freq, prev_len, bs = "cr"), data=train_data)
#c(logLik(mylm), logLik_test(mylm, train_data, train_data$psychometric))
#logLik_test(mylm, test_data, test_data$psychometric)

Data loading and preprocessing

# Raw harmonized results, one row per token per model/training/seed/corpus.
data <- read.csv("../data/harmonized_results.csv")

# Build lagged (previous-token) predictors within each
# corpus/model/training/seed series, then keep only rows whose lagged token
# codes are contiguous and that have no missing values.
all_data <- data %>%
  mutate(seed = as.factor(seed)) %>%
  group_by(corpus, model, training, seed) %>%
  mutate(
    # One token back. (prev_surp used to be assigned twice in this call;
    # the redundant second assignment has been removed.)
    prev_surp = lag(surprisal),
    prev_code = lag(code),
    prev_len = lag(len),
    prev_freq = lag(freq),

    # Two tokens back.
    prev2_freq = lag(prev_freq),
    prev2_code = lag(prev_code),
    prev2_len = lag(prev_len),
    prev2_surp = lag(prev_surp),

    # Three tokens back.
    prev3_freq = lag(prev2_freq),
    prev3_code = lag(prev2_code),
    prev3_len = lag(prev2_len),
    prev3_surp = lag(prev2_surp)
  ) %>%
  ungroup() %>%
  # Contiguity filter: for dundee the token two positions back must carry
  # code - 2; for every other corpus the previous token must carry code - 1.
  # NOTE(review): the earlier comment here said "filter back three" for dundee,
  # and the dundee regressions use prev3_* predictors, yet prev3_code is never
  # checked. Confirm whether `code == prev3_code + 3` was intended.
  filter(
    (corpus == "dundee" & code == prev2_code + 2) |
      (corpus != "dundee" & code == prev_code + 1)
  ) %>%
  select(-prev_code, -prev2_code, -prev3_code) %>%
  # Rows at the start of each series have NA lags and are dropped here.
  drop_na()

# Normalise the model label "gpt-2" to "gpt2"; the column is converted to
# character for the comparison and back to a factor afterwards.
all_data <- mutate(
  all_data,
  model = as.factor(
    if_else(as.character(model) == "gpt-2", "gpt2", as.character(model))
  )
)
# Fit a linear model on one training subset and score it on the matching
# held-out rows.
#
# Arguments:
#   df        - training rows for one model/training/seed/corpus combination
#               (the callers pass one group at a time via do())
#   test_data - the full held-out fold; it is narrowed here to the rows sharing
#               df's training/model/seed/corpus values
#   formula   - regression formula handed to lm()
#   fold      - fold identifier, appended to the name the fit is stored under
#   store_env - environment that receives the fitted model
#
# Returns the summarise() result for df with columns
#   log_lik  - log-likelihood of the fit on the training rows,
#   test_lik - summed log-likelihood on the matching held-out rows,
#   test_mse - mean squared error on the matching held-out rows.
# Side effect: assigns the fitted model into store_env.
get_lm_data <- function(df, test_data, formula, fold, store_env) {
  # this_lm <- gam(formula, data = df)
  this_lm <- lm(formula, data = df)
  this_test_data <- semi_join(
    test_data, df,
    by = c("training", "model", "seed", "corpus")
  )

  # Store the fit in store_env (not the global environment) under
  # "<model> <training> <seed> <corpus> <fold>" so later steps can look it up.
  lm_name <- paste(
    unique(paste(df$model, df$training, df$seed, df$corpus))[1],
    fold
  )
  assign(lm_name, this_lm, envir = store_env)

  summarise(
    df,
    # FALSE is spelled out: `F` is an ordinary variable that can be reassigned.
    log_lik = as.numeric(logLik(this_lm, REML = FALSE)),
    test_lik = logLik_test(
      this_lm, this_test_data, this_test_data$psychometric
    ),
    test_mse = mse_test(this_lm, this_test_data, this_test_data$psychometric)
  )
}
# Look up the model previously stored for this data subset and fold, and attach
# per-row diagnostics to the subset.
#
# Arguments:
#   df        - rows of a single model/training/seed/corpus combination
#   fold      - fold identifier used when the model was stored
#   store_env - environment holding the fitted models
#
# Returns df with two added columns: `likelihood` (per-row log-likelihood) and
# `resid` (observed psychometric value minus the model's prediction).
get_lm_residuals <- function(df, fold, store_env) {
  # Models are stored under "<model> <training> <seed> <corpus> <fold>".
  group_labels <- unique(paste(df$model, df$training, df$seed, df$corpus))
  stored_lm <- get(paste(group_labels[1], fold), envir = store_env)

  mutate(
    df,
    likelihood = logLik_test_per(stored_lm, df, df$psychometric),
    resid = df$psychometric - predict(stored_lm, df, re.form = NA)
  )
}
# Per-row difference in held-out log-likelihood between the full model and the
# baseline model stored for this data subset and fold.
#
# Arguments:
#   test_data    - held-out rows of one model/training/seed/corpus combination
#   fold         - fold identifier used when the models were stored
#   baseline_env - environment holding the baseline fits
#   full_env     - environment holding the full fits
#
# Returns test_data with an extra column `delta_log_lik`
# (full minus baseline), bound on with cbind().
get_lm_delta_log_lik <- function(test_data, fold, baseline_env, full_env) {
  group_label <- unique(paste(
    test_data$model, test_data$training, test_data$seed, test_data$corpus
  ))[1]
  lm_key <- paste(group_label, fold)

  baseline_fit <- get(lm_key, envir = baseline_env)
  full_fit <- get(lm_key, envir = full_env)

  observed <- test_data$psychometric
  full_log_lik <- logLik_test_per(full_fit, test_data, observed)
  baseline_log_lik <- logLik_test_per(baseline_fit, test_data, observed)

  cbind(test_data, delta_log_lik = full_log_lik - baseline_log_lik)
}
#####
# Define regression formulae.
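# Commented-out GAM formulae (kept for reference): the eye-tracking regression uses the current and previous word only; the SPRT regression also uses 2-back features.
# NOTE: the active linear formulae further below use different lags: the "rt" formulae go three words back, the "sprt" formulae one word back.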
#baseline_rt_regression = psychometric ~ te(freq, len, bs = "cr") + te(prev_freq, prev_len, bs = "cr")
#baseline_sprt_regression = psychometric ~ te(freq, len, bs = "cr") + te(prev_freq, prev_len, bs = "cr") + te(prev2_freq, prev2_len, bs = "cr")
#full_rt_regression = (psychometric ~ s(surprisal, bs = "cr", k = 20) + s(prev_surp, bs = "cr", k = 20)
                     #+ te(freq, len, bs = "cr") + te(prev_freq, prev_len, bs = "cr"))
#full_sprt_regression = (psychometric ~ s(surprisal, bs = "cr", k = 20) + s(prev_surp, bs = "cr", k = 20) + s(prev2_surp, bs = "cr", k = 20)
                        #+ te(freq, len, bs = "cr") + te(prev_freq, prev_len, bs = "cr") + te(prev2_freq, prev2_len, bs = "cr"))

# Baseline formulae: frequency and length predictors only.
# "rt" covers the current word and the three preceding words.
baseline_rt_regression <- psychometric ~
  freq + prev_freq + prev2_freq + prev3_freq +
  len + prev_len + prev2_len + prev3_len
# "sprt" covers the current word and the preceding word.
baseline_sprt_regression <- psychometric ~
  freq + prev_freq + len + prev_len

# Full formulae: the baseline predictors plus surprisal at the same lags.
full_rt_regression <- psychometric ~
  surprisal + prev_surp + prev2_surp + prev3_surp +
  freq + prev_freq + prev2_freq + prev3_freq +
  len + prev_len + prev2_len + prev3_len
full_sprt_regression <- psychometric ~
  surprisal + prev_surp + freq + prev_freq + len + prev_len
  
#####
# Prepare frames/environments for storing results/objects.
# Accumulators that the cross-validation loop appends to, one batch per fold.
baseline_results <- data.frame()
full_model_results <- data.frame()
#baseline_residuals = data.frame()
#full_residuals = data.frame()
log_lik_deltas <- data.frame()

# Shuffle the rows so that fold membership is random.
# NOTE(review): no set.seed() call is visible before this point, so the fold
# assignment presumably differs from run to run. Confirm whether that is wanted.
all_data <- all_data[sample.int(nrow(all_data)), ]

# Number of folds, and a fold label (1..K) for every shuffled row; cut() splits
# the row positions into K contiguous, near-equal ranges.
K <- 5
folds <- cut(seq_len(nrow(all_data)), breaks = K, labels = FALSE)
# K-fold cross-validation is run in the loop below.

# Fit the baseline (no-surprisal) regression for one group of training rows in
# one fold, picking the formula by corpus.
#
# Arguments:
#   corpus    - corpus label of the group; only its first element is inspected
#   df        - training rows of the group
#   test_data - held-out rows of the current fold
#   fold      - fold identifier
#   env       - environment in which get_lm_data() stores the fitted model
#
# Returns whatever get_lm_data() returns for the chosen formula:
# baseline_rt_regression for "dundee", baseline_sprt_regression otherwise.
baseline_corpus <- function(corpus, df, test_data, fold, env) {
  # Index the first element, as full_model_corpus does, so that a `corpus`
  # vector longer than one never reaches `if` as a vector condition.
  if (corpus[1] == "dundee") {
    get_lm_data(df, test_data, baseline_rt_regression, fold, env)
  } else {
    get_lm_data(df, test_data, baseline_sprt_regression, fold, env)
  }
}
# Fit the full (surprisal-including) regression for one group of training rows
# in one fold. The formula depends on the first element of `corpus`:
# full_rt_regression for "dundee", full_sprt_regression for anything else.
# All other arguments are passed straight through to get_lm_data().
full_model_corpus <- function(corpus, df, test_data, fold, env) {
  is_dundee <- corpus[1] == "dundee"
  regression <- if (is_dundee) full_rt_regression else full_sprt_regression
  get_lm_data(df, test_data, regression, fold, env)
}

# Environments that hold the fitted models, keyed by
# "<model> <training> <seed> <corpus> <fold>". The fitting helpers write into
# them and the delta-log-likelihood step reads the fits back.
baseline_env <- new.env()
full_env <- new.env()

# K-fold cross-validation: for each fold, fit baseline and full models on the
# remaining rows and score both on the held-out rows.
for (i in seq_len(K)) {
  # Segment the data by fold: rows labelled i are held out, the rest are used
  # for fitting.
  testIndexes <- which(folds == i)
  test_data <- all_data[testIndexes, ]
  train_data <- all_data[-testIndexes, ]

  # Compute a baseline linear model for each model--training--seed--RT-corpus
  # combination. A stray `print(model) %>%` debugging step used to sit in this
  # pipeline; it printed the grouped data on every fold, and its `model`
  # argument was a positional argument to print(), not a column reference, so
  # it has been removed.
  baselines <- train_data %>%
    group_by(model, training, seed, corpus) %>%
    do(baseline_corpus(unique(.$corpus), ., test_data, i, baseline_env)) %>%
    ungroup() %>%
    mutate(seed = as.factor(seed),
           fold = i)

  baseline_results <- rbind(baseline_results, baselines)

  # Compute a full linear model for each model--training--seed--RT-corpus
  # combination.
  full_models <- train_data %>%
    group_by(model, training, seed, corpus) %>%
    do(full_model_corpus(unique(.$corpus), ., test_data, i, full_env)) %>%
    ungroup() %>%
    mutate(seed = as.factor(seed),
           fold = i)

  full_model_results <- rbind(full_model_results, full_models)

  # Compute per-row delta-log-likelihoods (full minus baseline) on the held-out
  # rows, using the fits stored for this fold.
  fold_log_lik_deltas <- test_data %>%
    group_by(model, training, seed, corpus) %>%
    do(get_lm_delta_log_lik(., i, baseline_env, full_env)) %>%
    ungroup()

  log_lik_deltas <- rbind(log_lik_deltas, fold_log_lik_deltas)

  # fold_baseline_residuals = test_data %>%
  #   group_by(model, training, seed, corpus) %>%
  #     do(get_lm_residuals(., i, baseline_env)) %>%
  #   ungroup()
  #
  # baseline_residuals = rbind(baseline_residuals, fold_baseline_residuals)
  #
  # fold_full_residuals = test_data %>%
  #   group_by(model, training, seed, corpus) %>%
  #     do(get_lm_residuals(., i, full_env)) %>%
  #   ungroup()
  #
  # full_residuals = rbind(full_residuals, fold_full_residuals)
}

|==========================================================================================================                                                                      | 60% ~2 s remaining     
|================================================================================================================                                                                | 64% ~1 s remaining     
|======================================================================================================================                                                          | 67% ~1 s remaining     
|============================================================================================================================                                                    | 71% ~1 s remaining     
|==================================================================================================================================                                              | 74% ~1 s remaining     
|========================================================================================================================================                                        | 78% ~1 s remaining     
|==============================================================================================================================================                                  | 81% ~1 s remaining     
|====================================================================================================================================================                            | 84% ~1 s remaining     
|==========================================================================================================================================================                      | 88% ~0 s remaining     
|================================================================================================================================================================                | 91% ~0 s remaining     
|======================================================================================================================================================================          | 95% ~0 s remaining     
|============================================================================================================================================================================    | 98% ~0 s remaining     
|===========================================================================================                                                                                     | 52% ~2 s remaining     
|==============================================================================================                                                                                  | 53% ~2 s remaining     
|====================================================================================================                                                                            | 57% ~2 s remaining     
|==========================================================================================================                                                                      | 60% ~2 s remaining     
|================================================================================================================                                                                | 64% ~1 s remaining     
|======================================================================================================================                                                          | 67% ~1 s remaining     
|============================================================================================================================                                                    | 71% ~1 s remaining     
|==================================================================================================================================                                              | 74% ~1 s remaining     
|========================================================================================================================================                                        | 78% ~1 s remaining     
|==============================================================================================================================================                                  | 81% ~1 s remaining     
|====================================================================================================================================================                            | 84% ~1 s remaining     
|==========================================================================================================================================================                      | 88% ~0 s remaining     
|================================================================================================================================================================                | 91% ~0 s remaining     
|======================================================================================================================================================================          | 95% ~0 s remaining     
|============================================================================================================================================================================    | 98% ~0 s remaining     

|====================================================================================================                                                                            | 57% ~2 s remaining     
|==========================================================================================================                                                                      | 60% ~1 s remaining     
|================================================================================================================                                                                | 64% ~1 s remaining     
|======================================================================================================================                                                          | 67% ~1 s remaining     
|============================================================================================================================                                                    | 71% ~1 s remaining     
|==================================================================================================================================                                              | 74% ~1 s remaining     
|========================================================================================================================================                                        | 78% ~1 s remaining     
|==============================================================================================================================================                                  | 81% ~1 s remaining     
|====================================================================================================================================================                            | 84% ~1 s remaining     
|=======================================================================================================================================================                         | 86% ~0 s remaining     
|==========================================================================================================================================================                      | 88% ~0 s remaining     
|================================================================================================================================================================                | 91% ~0 s remaining     
|======================================================================================================================================================================          | 95% ~0 s remaining     
|============================================================================================================================================================================    | 98% ~0 s remaining     
|======================================================================================================================                                                          | 67% ~1 s remaining     
|============================================================================================================================                                                    | 71% ~1 s remaining     
|==================================================================================================================================                                              | 74% ~1 s remaining     
|========================================================================================================================================                                        | 78% ~1 s remaining     
|==============================================================================================================================================                                  | 81% ~1 s remaining     
|====================================================================================================================================================                            | 84% ~1 s remaining     
|==========================================================================================================================================================                      | 88% ~0 s remaining     
|================================================================================================================================================================                | 91% ~0 s remaining     
|======================================================================================================================================================================          | 95% ~0 s remaining     
|============================================================================================================================================================================    | 98% ~0 s remaining     
|================================================================================================================================================================================|100% ~0 s remaining     

|==========================================================================================================                                                                      | 60% ~1 s remaining     
|================================================================================================================                                                                | 64% ~1 s remaining     
|======================================================================================================================                                                          | 67% ~1 s remaining     
|============================================================================================================================                                                    | 71% ~1 s remaining     
|==================================================================================================================================                                              | 74% ~1 s remaining     
|========================================================================================================================================                                        | 78% ~1 s remaining     
|==============================================================================================================================================                                  | 81% ~1 s remaining     
|====================================================================================================================================================                            | 84% ~1 s remaining     
|==========================================================================================================================================================                      | 88% ~0 s remaining     
|================================================================================================================================================================                | 91% ~0 s remaining     
|======================================================================================================================================================================          | 95% ~0 s remaining     
|============================================================================================================================================================================    | 98% ~0 s remaining     
|===================================================================================================================                                                             | 66% ~1 s remaining     
|======================================================================================================================                                                          | 67% ~1 s remaining     
|============================================================================================================================                                                    | 71% ~1 s remaining     
|==================================================================================================================================                                              | 74% ~1 s remaining     
|========================================================================================================================================                                        | 78% ~1 s remaining     
|==============================================================================================================================================                                  | 81% ~1 s remaining     
|====================================================================================================================================================                            | 84% ~0 s remaining     
|=======================================================================================================================================================                         | 86% ~0 s remaining     
|==========================================================================================================================================================                      | 88% ~0 s remaining     
|================================================================================================================================================================                | 91% ~0 s remaining     
|======================================================================================================================================================================          | 95% ~0 s remaining     
|============================================================================================================================================================================    | 98% ~0 s remaining     

|============================================================================================================================                                                    | 71% ~1 s remaining     
|==================================================================================================================================                                              | 74% ~1 s remaining     
|========================================================================================================================================                                        | 78% ~1 s remaining     
|==============================================================================================================================================                                  | 81% ~1 s remaining     
|====================================================================================================================================================                            | 84% ~0 s remaining     
|==========================================================================================================================================================                      | 88% ~0 s remaining     
|================================================================================================================================================================                | 91% ~0 s remaining     
|======================================================================================================================================================================          | 95% ~0 s remaining     
|============================================================================================================================================================================    | 98% ~0 s remaining     
|=================================================================================================                                                                               | 55% ~2 s remaining     
|====================================================================================================                                                                            | 57% ~2 s remaining     
|==========================================================================================================                                                                      | 60% ~1 s remaining     
|================================================================================================================                                                                | 64% ~1 s remaining     
|===================================================================================================================                                                             | 66% ~1 s remaining     
|======================================================================================================================                                                          | 67% ~1 s remaining     
|============================================================================================================================                                                    | 71% ~1 s remaining     
|==================================================================================================================================                                              | 74% ~1 s remaining     
|========================================================================================================================================                                        | 78% ~1 s remaining     
|==============================================================================================================================================                                  | 81% ~1 s remaining     
|====================================================================================================================================================                            | 84% ~1 s remaining     
|=======================================================================================================================================================                         | 86% ~1 s remaining     
|==========================================================================================================================================================                      | 88% ~0 s remaining     
|================================================================================================================================================================                | 91% ~0 s remaining     
|======================================================================================================================================================================          | 95% ~0 s remaining     
|============================================================================================================================================================================    | 98% ~0 s remaining     

|============================================================================================================================                                                    | 71% ~1 s remaining     
|==================================================================================================================================                                              | 74% ~1 s remaining     
|========================================================================================================================================                                        | 78% ~1 s remaining     
|==============================================================================================================================================                                  | 81% ~1 s remaining     
|====================================================================================================================================================                            | 84% ~0 s remaining     
|==========================================================================================================================================================                      | 88% ~0 s remaining     
|================================================================================================================================================================                | 91% ~0 s remaining     
|======================================================================================================================================================================          | 95% ~0 s remaining     
|============================================================================================================================================================================    | 98% ~0 s remaining     
|======================================================================================================================                                                          | 67% ~1 s remaining     
|============================================================================================================================                                                    | 71% ~1 s remaining     
|==================================================================================================================================                                              | 74% ~1 s remaining     
|========================================================================================================================================                                        | 78% ~1 s remaining     
|===========================================================================================================================================                                     | 79% ~1 s remaining     
|==============================================================================================================================================                                  | 81% ~1 s remaining     
|====================================================================================================================================================                            | 84% ~0 s remaining     
|==========================================================================================================================================================                      | 88% ~0 s remaining     
|================================================================================================================================================================                | 91% ~0 s remaining     
|======================================================================================================================================================================          | 95% ~0 s remaining     
|============================================================================================================================================================================    | 98% ~0 s remaining     
#write.csv(full_residuals, "../data/analysis_checkpoints/full_residuals.csv")
#write.csv(baseline_residuals, "../data/analysis_checkpoints/baseline_residuals.csv")
# Collapse log_lik_deltas to one row per model / training / seed / corpus,
# keeping the mean delta log-likelihood and its standard error of the mean.
model_deltas <- log_lik_deltas %>%
  group_by(model, training, seed, corpus) %>%
  summarise(
    mean_delta_log_lik = mean(delta_log_lik),
    # SEM = sample standard deviation / sqrt(number of rows in the group).
    sem_delta_log_lik = sd(delta_log_lik) / sqrt(n())
  )
# Checkpoint the full-model and baseline results to disk as CSV.
# NOTE(review): the full-model file is written as "full_model_result.csv"
# (singular), which matches neither the baseline file's naming nor the
# commented-out read paths below -- confirm the intended file names.
write.csv(x = full_model_results,
          file = "../data/analysis_checkpoints/full_model_result.csv")
write.csv(x = baseline_results,
          file = "../data/analysis_checkpoints/baseline_results.csv")
#full_model_results = read.csv("../data/analysis_checkpoints/ffull_model_results.csv")
#baseline_results = read.csv("../data/analysis_checkpoints/fbaseline_resultsb.csv")
# Axis label for the evaluation metric currently in use.
metric <- "ΔLogLik"
#metric <- "-ΔMSE"

# Select the relevant metric: expose it under the generic delta_test_* column
# names used by the rest of the analysis, then drop the metric-specific
# source columns.
model_deltas <- model_deltas %>%
  mutate(
    delta_test_mean = mean_delta_log_lik,
    delta_test_sem = sem_delta_log_lik
    # MSE alternative:
    #   delta_test_mean = mean_delta_mse,
    #   delta_test_sem = sem_delta_mse
  ) %>%
  # Remove the raw metrics.
  # (Optionally also: -mean_delta_mse, -sem_delta_mse)
  select(-c(mean_delta_log_lik, sem_delta_log_lik))
model_deltas
# Sanity check: training on train+test data should yield improved performance over training on just training data. (When evaluating on test data.)
# full_baselines = all_data %>%
#   group_by(model, training, seed, corpus) %>%
#   summarise(baseline_train_all_test_lik = logLik_test(lm(psychometric ~ len + freq + sent_pos, data=.), semi_join(test_data, ., by=c("training", "model", "seed", "corpus")), semi_join(test_data, ., by=c("training", "model", "seed", "corpus"))$psychometric)) %>%
#   ungroup()
# full_baselines
# 
# full_baselines %>%
#   right_join(baselines, by=c("seed", "training", "model", "corpus")) %>%
#   mutate(delta=baseline_train_all_test_lik-baseline_test_lik) %>%
#   select(-baseline_lik) # %>%
#   #select(-baseline_test_lik, -baseline_train_all_test_lik, -baseline_lik, -baseline_test_mse)

Load language model data (SyntaxGym, PPL)

# Read the per-model metadata and normalise it so it can be joined with
# model_deltas on (seed, training, model).
language_model_data <- read.csv("../data/model_metadata.csv") %>%
  mutate(
    # Rename "gpt-2" to "gpt2". The comparison and replacement are done on
    # character values, then the column is converted back to a factor.
    model = as.character(model),
    model = if_else(model == "gpt-2", "gpt2", model),
    model = as.factor(model),

    # Numeric size of each BLLIP training split (later plotted as millions of
    # training tokens). Training names matching none of the prefixes get NA.
    train_size = case_when(
      str_starts(training, "bllip-lg") ~ 42,
      str_starts(training, "bllip-md") ~ 15,
      str_starts(training, "bllip-sm") ~ 5,
      str_starts(training, "bllip-xs") ~ 1
    ),

    # Training vocabulary usually covaries with the training corpus.
    # But BPE models share a vocabulary across training corpora.
    training_vocab = as.factor(
      ifelse(str_detect(training, "gptbpe"), "gptbpe", as.character(training))
    ),

    seed = as.factor(seed)
  ) %>%
  select(-pid, -test_loss) %>%
  # Keep only the first row for each model / training / seed combination.
  distinct(model, training, seed, .keep_all = TRUE)

# Number of metadata rows per seed.
table(language_model_data$seed)

         0        111        120        922       1111       3602       4301       7245       7877      28066      28068      44862      51272      64924 1581807512 1581807578 1581861474 1581955288 
         4          7          6          5          4          1          1          1          1          1          1          1          1          1          1          1          1          1 
1582126320 1586986276 1587139950 
         1          1          1 
# Number of model_deltas rows per seed, for comparison with the seed counts
# in the language-model metadata before the two tables are joined.
table(model_deltas$seed)

       111        120        922       1111       3602       4301       7245       7877      28066      28068      44862      51272      64924 1581807512 1581807578 1581861474 1581955288 1582126320 
         6          6          6          8          2          2          2          2          2          2          2          2          2          2          2          2          2          2 
1586986276 1587139950 
         2          2 

First join delta-metric data with model auxiliary data.

# Attach the language-model metadata to each row of model_deltas, matching on
# seed, training set and model.
#
# The merge is a full outer join (all = TRUE), but the following drop_na()
# removes every row that contains any missing value. Rows left unmatched by
# the join therefore do not survive, and neither do rows with an NA in any
# metadata column.
model_deltas <- model_deltas %>%
  merge(language_model_data,
        by = c("seed", "training", "model"),
        all = TRUE) %>%
  drop_na()

model_deltas

Also join on the original linear model data, rather than collapsing to delta-metrics. This will support regressions later on that don’t collapse across folds.

Final data preprocessing

# Drop every row belonging to the "ordered-neurons" model; it is excluded
# from all analyses that follow.
model_deltas <- filter(model_deltas, model != "ordered-neurons")

Visualizations

Predictive power and SG

# Scatter of syntactic generalization (SG) score against the selected
# predictive-power metric, one panel per corpus. Error bars show +/- one SEM
# of the metric; the smooth is a linear fit with its confidence band.
model_deltas %>%
  ggplot(aes(x = sg_score, y = delta_test_mean)) +
    geom_errorbar(aes(ymin = delta_test_mean - delta_test_sem,
                      ymax = delta_test_mean + delta_test_sem)) +
    geom_smooth(method = "lm", se = TRUE) +
    geom_point(stat = "identity", position = "dodge", alpha = 1, size = 3,
               aes(color = training_vocab, shape = model)) +
    ylab(metric) +
    xlab("Syntax Generalization Score") +
    ggtitle("Syntactic Generalization vs. Predictive Power") +
    # Fixed colour per training vocabulary; all BPE models share one grey.
    scale_color_manual(values = c("bllip-lg" = "#440154FF",
                                  "bllip-md" = "#39568CFF",
                                  "bllip-sm" = "#1F968BFF",
                                  "bllip-xs" = "#73D055FF",
                                  "gptbpe" = "#888888")) +
    facet_grid(~corpus, scales = "free") +
    theme(axis.text = element_text(size = 14),
          strip.text.x = element_text(size = 14),
          legend.text = element_text(size = 14),
          axis.title = element_text(size = 18),
          legend.position = "bottom")

#ggsave("./cogsci_images/sg_loglik.png",height=5,width=6)

Regression analyses

We control for effects of perplexity by relating the residuals of a performance ~ PPL regression to SG score.

# Prepare a residualized comparison of SG score and the delta metric, with
# the effect of test perplexity (PPL) regressed out of both.
#
# The result has one row per model / training_vocab / corpus / seed holding
# the mean and SEM of each residual. sd() is NA for a single-row group, so
# the SEM columns are NA wherever a group contains only one row.
#
# NOTE(review): the delta metric is residualized on training:test_ppl here,
# whereas do_stepwise_regression() uses training_vocab:test_ppl -- confirm
# that the difference is intended.
d_resid <- model_deltas %>%
  drop_na() %>%

  # Residualize the delta metric w.r.t. PPL, separately within each corpus.
  group_by(corpus) %>%
  mutate(resid.delta = resid(lm(delta_test_mean ~ training:test_ppl))) %>%
  ungroup() %>%

  # Residualize SG score w.r.t. PPL for each training vocabulary.
  # NB no need for a training:ppl interaction, since we're within-group.
  group_by(training_vocab) %>%
  mutate(resid.sg = resid(lm(sg_score ~ test_ppl))) %>%
  ungroup() %>%

  # Compute summary statistics across model--training_vocab--corpus--seed.
  group_by(model, training_vocab, corpus, seed) %>%
  summarise(
    resid.delta.mean = mean(resid.delta),
    resid.delta.sem = sd(resid.delta) / sqrt(n()),
    resid.sg.mean = mean(resid.sg),
    resid.sg.sem = sd(resid.sg) / sqrt(n())
  ) %>%
  # summarise() only peels off the last grouping variable; drop the rest so
  # downstream code does not inherit a grouped data frame by accident.
  ungroup()
# Now plot residual vs SG
# Now plot residual delta metric vs. residual SG score, one panel per corpus.
#
# geom_errorbar() only understands ymin/ymax: passing xmin/xmax to it makes
# ggplot2 warn "Ignoring unknown aesthetics: xmin, xmax" and the horizontal
# bars are never drawn. The vertical (delta metric) and horizontal (SG) SEM
# bars are therefore drawn by separate layers.
d_resid %>%
  #filter(corpus != "bnc-brown") %>%
  ggplot(aes(x = resid.sg.mean, y = resid.delta.mean)) +
    geom_errorbar(aes(ymin = resid.delta.mean - resid.delta.sem,
                      ymax = resid.delta.mean + resid.delta.sem),
                  alpha = 0.3) +
    geom_errorbarh(aes(xmin = resid.sg.mean - resid.sg.sem,
                       xmax = resid.sg.mean + resid.sg.sem),
                   alpha = 0.3) +
    geom_smooth(method = "lm", se = TRUE) +
    geom_point(stat = "identity", position = "dodge", alpha = 1, size = 4,
               aes(shape = model, color = training_vocab)) +
    ylab(paste("Residual", metric)) +
    xlab("Residual Syntax Generalization Score") +
    ggtitle("Syntactic Generalization vs. Predictive Power") +
    scale_color_manual(values = c("bllip-lg" = "#440154FF",
                                  "bllip-md" = "#39568CFF",
                                  "bllip-sm" = "#1F968BFF",
                                  "bllip-xs" = "#73D055FF",
                                  "gptbpe" = "#888888")) +
    facet_grid(. ~ corpus, scales = "free") +
    theme(axis.text = element_text(size = 14),
          strip.text.x = element_text(size = 14),
          legend.text = element_text(size = 14),
          axis.title = element_text(size = 18),
          legend.position = "right")
Ignoring unknown aesthetics: xmin, xmax
# Write a plot to disk as an 11 x 4.5 PNG. No plot object is passed, so
# ggsave() falls back to its default, the last plot displayed.
ggsave("../images/cuny2020/ppl_sg.png",height=4.5,width=11)

# Test whether SG score explains variance in the delta metric beyond what
# test perplexity already explains, for a single corpus.
#
# Two nested linear models are fit on the rows of `data` for `cur_corpus`:
#   lm1: delta_test_mean ~ training_vocab:test_ppl
#   lm2: delta_test_mean ~ training_vocab:test_ppl + sg_score
# The corpus name and the nested-model ANOVA table are printed.
#
# Args:
#   cur_corpus: value of the `corpus` column selecting the rows to analyse.
#   data: data frame with columns corpus, delta_test_mean, training_vocab,
#     test_ppl and sg_score. Defaults to the global `model_deltas`, so
#     existing one-argument calls behave as before.
#
# Returns:
#   The summary() of lm2.
#
# Raises:
#   An error if `data` has no rows for `cur_corpus`.
do_stepwise_regression <- function(cur_corpus, data = model_deltas) {
  # which() drops rows whose corpus is NA instead of turning them into
  # all-NA rows.
  regression_data <- data[which(data$corpus == cur_corpus), , drop = FALSE]
  if (nrow(regression_data) == 0) {
    stop("No rows found for corpus '", cur_corpus, "'", call. = FALSE)
  }

  print("----------------------")
  print(cur_corpus)

  lm1 <- lm(delta_test_mean ~ training_vocab:test_ppl, data = regression_data)
  lm2 <- lm(delta_test_mean ~ training_vocab:test_ppl + sg_score,
            data = regression_data)
  print(anova(lm1, lm2))
  summary(lm2)
}
#do_stepwise_regression("bnc-brown")
do_stepwise_regression("dundee")
[1] "----------------------"
[1] "dundee"
Analysis of Variance Table

Model 1: delta_test_mean ~ training_vocab:test_ppl
Model 2: delta_test_mean ~ training_vocab:test_ppl + sg_score
  Res.Df        RSS Df  Sum of Sq      F Pr(>F)
1     23 0.00037542                            
2     22 0.00037301  1 2.4117e-06 0.1422 0.7097

Call:
lm(formula = delta_test_mean ~ training_vocab:test_ppl + sg_score, 
    data = regression_data)

Residuals:
      Min        1Q    Median        3Q       Max 
-0.003573 -0.002545 -0.001998  0.002783  0.007007 

Coefficients:
                                  Estimate Std. Error t value Pr(>|t|)  
(Intercept)                      9.497e-03  4.523e-03   2.100   0.0474 *
sg_score                         2.429e-03  6.440e-03   0.377   0.7097  
training_vocabbllip-lg:test_ppl -5.322e-05  4.190e-05  -1.270   0.2174  
training_vocabbllip-md:test_ppl -6.608e-05  3.492e-05  -1.892   0.0717 .
training_vocabbllip-sm:test_ppl -6.472e-05  3.110e-05  -2.081   0.0493 *
training_vocabbllip-xs:test_ppl -5.211e-05  2.075e-05  -2.512   0.0199 *
training_vocabgptbpe:test_ppl    2.816e-05  1.019e-05   2.762   0.0114 *
---
Signif. codes:  0 ‘***’ 0.001 ‘**’ 0.01 ‘*’ 0.05 ‘.’ 0.1 ‘ ’ 1

Residual standard error: 0.004118 on 22 degrees of freedom
Multiple R-squared:  0.6547,    Adjusted R-squared:  0.5605 
F-statistic: 6.951 on 6 and 22 DF,  p-value: 0.000304
do_stepwise_regression("natural-stories")
[1] "----------------------"
[1] "natural-stories"
Analysis of Variance Table

Model 1: delta_test_mean ~ training_vocab:test_ppl
Model 2: delta_test_mean ~ training_vocab:test_ppl + sg_score
  Res.Df        RSS Df  Sum of Sq      F Pr(>F)
1     23 1.0694e-04                            
2     22 9.7417e-05  1 9.5188e-06 2.1497 0.1567

Call:
lm(formula = delta_test_mean ~ training_vocab:test_ppl + sg_score, 
    data = regression_data)

Residuals:
       Min         1Q     Median         3Q        Max 
-0.0028202 -0.0014519 -0.0002531  0.0012548  0.0040795 

Coefficients:
                                  Estimate Std. Error t value Pr(>|t|)    
(Intercept)                      8.349e-03  2.311e-03   3.612 0.001546 ** 
sg_score                         4.826e-03  3.291e-03   1.466 0.156749    
training_vocabbllip-lg:test_ppl -3.997e-05  2.141e-05  -1.866 0.075363 .  
training_vocabbllip-md:test_ppl -5.271e-05  1.785e-05  -2.953 0.007344 ** 
training_vocabbllip-sm:test_ppl -5.135e-05  1.589e-05  -3.231 0.003841 ** 
training_vocabbllip-xs:test_ppl -4.159e-05  1.060e-05  -3.922 0.000728 ***
training_vocabgptbpe:test_ppl   -1.516e-06  5.210e-06  -0.291 0.773803    
---
Signif. codes:  0 ‘***’ 0.001 ‘**’ 0.01 ‘*’ 0.05 ‘.’ 0.1 ‘ ’ 1

Residual standard error: 0.002104 on 22 degrees of freedom
Multiple R-squared:  0.6844,    Adjusted R-squared:  0.5984 
F-statistic: 7.952 on 6 and 22 DF,  p-value: 0.0001219

Predictive power and perplexity

# Test perplexity against the selected predictive-power metric, one panel per
# corpus, coloured by training vocabulary and shaped by model. Error bars
# show +/- one SEM of the metric.
ggplot(model_deltas,
       aes(x = test_ppl, y = delta_test_mean, color = training_vocab)) +
  geom_errorbar(
    aes(ymin = delta_test_mean - delta_test_sem,
        ymax = delta_test_mean + delta_test_sem),
    alpha = 0.4
  ) +
  #geom_smooth(method="lm", se=F) +
  geom_point(aes(shape = model),
             stat = "identity", position = "dodge", alpha = 1, size = 4) +
  facet_grid(~corpus, scales = "free") +
  #coord_cartesian(ylim = c(1, 16)) +
  #coord_cartesian(ylim = c(0, 150)) +
  scale_color_manual(values = c("bllip-lg" = "#440154FF",
                                "bllip-md" = "#39568CFF",
                                "bllip-sm" = "#1F968BFF",
                                "bllip-xs" = "#73D055FF",
                                "gptbpe" = "#888888")) +
  labs(x = "Test Perplexity",
       y = metric,
       title = "Test Perplexity vs. Predictive Power") +
  theme(axis.text = element_text(size = 12),
        strip.text.x = element_text(size = 12),
        legend.text = element_text(size = 12),
        axis.title = element_text(size = 12),
        legend.position = "right")
# Save the plot just displayed.
ggsave("../images/cuny2020/ppl_loglik.png", width = 11, height = 4.5)

# For each model and corpus, correlate the delta metric with test perplexity
# using cor.test() with its default settings, and report the correlation
# estimate and its p-value.
model_deltas %>%
  #filter(model != "5gram", training != "bllip-lg") %>%
  group_by(model, corpus) %>%
  #summarise(n = n())
  summarise(
    # as.numeric() strips the name that cor.test() attaches to the estimate.
    corr = as.numeric(cor.test(delta_test_mean, test_ppl)$estimate),
    pval = as.numeric(cor.test(delta_test_mean, test_ppl)$p.value)
  )

Effect of training data size

# Log training-set size against the selected predictive-power metric, with a
# panel for every corpus (rows) x model (columns) combination. Error bars
# show +/- one SEM; the smooth is a linear fit with its confidence band.
model_deltas %>%
  # Plot on a natural-log scale of train_size.
  mutate(train_size = log(train_size)) %>%
  ggplot(aes(x = train_size, y = delta_test_mean, color = model)) +
    geom_errorbar(aes(ymin = delta_test_mean - delta_test_sem,
                      ymax = delta_test_mean + delta_test_sem),
                  width = 0.1) +
    geom_smooth(method = "lm", se = TRUE, alpha = 0.5) +
    geom_point(stat = "identity", position = "dodge", alpha = 1, size = 3) +
    ylab(metric) +
    xlab("Log Million Training Tokens") +
    ggtitle("Training Size vs. Predictive Power") +
    facet_grid(corpus ~ model, scales = "free") +
    #scale_color_manual(values = c("#A42EF1", "#3894C8")) +
    theme(axis.text = element_text(size = 14),
          strip.text.x = element_text(size = 14),
          legend.text = element_text(size = 14),
          axis.title = element_text(size = 18),
          legend.position = "bottom")

#ggsave("./cogsci_images/training_loglik.png",height=5,width=6)
# Log training-set size against SG score, one panel per model, with a linear
# fit and its confidence band.
model_deltas %>%
  # Plot on a natural-log scale of train_size.
  mutate(train_size = log(train_size)) %>%
  ggplot(aes(x = train_size, y = sg_score, color = model)) +
    geom_smooth(method = "lm", se = TRUE, alpha = 0.5) +
    geom_point(stat = "identity", position = "dodge", alpha = 1, size = 3) +
    ylab("SG Score") +
    xlab("Log Million Training Tokens") +
    ggtitle("Training Size vs. Syntactic Generalization") +
    #scale_color_manual(values = c("#A42EF1", "#3894C8")) +
    facet_grid(~model, scales = "free") +
    theme(axis.text = element_text(size = 14),
          strip.text.x = element_text(size = 14),
          legend.text = element_text(size = 14),
          axis.title = element_text(size = 18),
          legend.position = "bottom")

#ggsave("./cogsci_images/training_sg.png",height=5,width=6)

Smith & Levy reproduction

  
# Smoothed relationship between surprisal and the psychometric measure, drawn
# separately per training set (colour) in a corpus x model grid of panels.
all_data %>%
  # Keep only observations with surprisal strictly between 0 and 15.
  filter(surprisal < 15, surprisal > 0) %>%
  ggplot(aes(x = surprisal, y = psychometric, color = training)) +
    # No `method` is given, so ggplot2 picks its default smoother.
    # Spell out TRUE: `T` is an ordinary variable that can be reassigned.
    stat_smooth(se = TRUE, alpha = 0.5) +
    #geom_errorbar(color="black", width=.2, position=position_dodge(width=.9), alpha=0.3) +
    #geom_point(stat="identity", position="dodge", alpha=1, size=3) +
    ylab("Processing Time (ms)") +
    xlab("Surprisal (bits)") +
    ggtitle("Surprisal vs. Reading Time / Gaze Duration") +
    facet_grid(corpus ~ model, scales = "free") +
    # One colour per plain training set; every "-gptbpe" variant shares one grey.
    scale_color_manual(values = c("bllip-lg" = "#440154FF",
                                  "bllip-md" = "#39568CFF",
                                  "bllip-sm" = "#1F968BFF",
                                  "bllip-xs" = "#73D055FF",
                                  "bllip-lg-gptbpe" = "#888888",
                                  "bllip-md-gptbpe" = "#888888",
                                  "bllip-sm-gptbpe" = "#888888",
                                  "bllip-xs-gptbpe" = "#888888")) +
    # axis.text.y overrides the general axis.text size for the y axis only.
    theme(axis.text = element_text(size = 14),
          axis.text.y = element_text(size = 10),
          strip.text.x = element_text(size = 14),
          legend.text = element_text(size = 14),
          axis.title = element_text(size = 18),
          legend.position = "right")
# No plot object is passed, so ggsave() writes the most recently displayed plot.
ggsave("../images/cuny2020/surp_corr.png", height = 4.5, width = 12)

LS0tCnRpdGxlOiAiQ1VOWSAyMDIwIEFuYWx5c2lzIgpvdXRwdXQ6IGh0bWxfbm90ZWJvb2sKLS0tCgojIFBhY2thZ2VzIGFuZCB1dGlsaXRpZXMKCmBgYHtyfQpsaWJyYXJ5KHRpZHl2ZXJzZSkKbGlicmFyeShsbWU0KQpsaWJyYXJ5KGxtZXJUZXN0KQpsaWJyYXJ5KHBsb3RyaXgpCmxpYnJhcnkoc3RyaW5ncikKbGlicmFyeShyZWFkeGwpCmxpYnJhcnkoUkNvbG9yQnJld2VyKQpsaWJyYXJ5KG12dG5vcm0pCmxpYnJhcnkobWdjdikKYGBgCgpgYGB7cn0KIyBDb21wdXRlIHRoZSBsb2ctbGlrZWxpaG9vZCBvZiBhIG5ldyBkYXRhc2V0IHVzaW5nIGEgZml0IGxtZTQgbW9kZWwuCmxvZ0xpa190ZXN0IDwtIGZ1bmN0aW9uKGxtLCB0ZXN0X1gsIHRlc3RfeSkgewogIHByZWRpY3Rpb25zIDwtIHByZWRpY3QobG0sIHRlc3RfWCwgcmUuZm9ybT1OQSkKICAjIEdldCBzdGQuZGV2LiBvZiByZXNpZHVhbCwgZXN0aW1hdGVkIGZyb20gdHJhaW4gZGF0YQogIHN0ZGV2IDwtIHNpZ21hKGxtKQogICMgRm9yIGVhY2ggcHJlZGljdGlvbi0tb2JzZXJ2YXRpb24sIGdldCB0aGUgZGVuc2l0eSBwKG9icyB8IE4ocHJlZGljdGVkLCBtb2RlbF9zaWdtYSkpIGFuZCByZWR1Y2UKICBkZW5zaXR5IDwtIHN1bShkbm9ybSh0ZXN0X3ksIHByZWRpY3Rpb25zLCBzdGRldiwgbG9nPVRSVUUpKQogIHJldHVybihkZW5zaXR5KQp9CiMgR2V0IHBlci1wcmVkaWN0aW9uIGxvZy1saWtlbGlob29kCmxvZ0xpa190ZXN0X3BlciA8LSBmdW5jdGlvbihsbSwgdGVzdF9YLCB0ZXN0X3kpIHsKICBwcmVkaWN0aW9ucyA8LSBwcmVkaWN0KGxtLCB0ZXN0X1gsIHJlLmZvcm09TkEpCiAgIyBHZXQgc3RkLmRldi4gb2YgcmVzaWR1YWwsIGVzdGltYXRlZCBmcm9tIHRyYWluIGRhdGEKICBzdGRldiA8LSBzaWdtYShsbSkKICAjIEZvciBlYWNoIHByZWRpY3Rpb24tLW9ic2VydmF0aW9uLCBnZXQgdGhlIGRlbnNpdHkgcChvYnMgfCBOKHByZWRpY3RlZCwgbW9kZWxfc2lnbWEpKQogIGRlbnNpdGllcyA8LSBkbm9ybSh0ZXN0X3ksIHByZWRpY3Rpb25zLCBzdGRldiwgbG9nPVRSVUUpCiAgcmV0dXJuKGRlbnNpdGllcykKfQojIENvbXB1dGUgTVNFIG9mIGEgbmV3IGRhdGFzZXQgdXNpbmcgYSBmaXQgbG1lNCBtb2RlbC4KbXNlX3Rlc3QgPC0gZnVuY3Rpb24obG0sIHRlc3RfWCwgdGVzdF95KSB7CiAgcmV0dXJuKG1lYW4oKHByZWRpY3QobG0sIHRlc3RfWCwgcmUuZm9ybT1OQSkgLSB0ZXN0X3kpIF4gMikpCn0KI1Nhbml0eSBjaGVja3MKI215bG0gPC0gZ2FtKHBzeWNob21ldHJpYyB+ICBzKHN1cnByaXNhbCwgYnMgPSAiY3IiLCBrID0gMjApICsgcyhwcmV2X3N1cnAsIGJzID0gImNyIiwgayA9IDIwKSArIHRlKGZyZXEsIGxlbiwgYnMgPSAiY3IiKSArIHRlKHByZXZfZnJlcSwgcHJldl9sZW4sIGJzID0gImNyIiksIGRhdGE9dHJhaW5fZGF0YSkKI2MobG9nTGlrKG15bG0pLCBsb2dMaWtfdGVzdChteWxtLCB0cmFpbl9kYXRhLCB0cmFpbl9kYXRhJHBzeWNob21ldHJpYykpCiNsb2dMaWtf
dGVzdChteWxtLCB0ZXN0X2RhdGEsIHRlc3RfZGF0YSRwc3ljaG9tZXRyaWMpCmBgYAoKIyBEYXRhIGxvYWRpbmcgYW5kIHByZXByb2Nlc3NpbmcKCmBgYHtyfQpkYXRhID0gcmVhZC5jc3YoIi4uL2RhdGEvaGFybW9uaXplZF9yZXN1bHRzLmNzdiIpCgphbGxfZGF0YSA9IGRhdGEgJT4lCiAgbXV0YXRlKHNlZWQgPSBhcy5mYWN0b3Ioc2VlZCkpICU+JQogIGdyb3VwX2J5KGNvcnB1cywgbW9kZWwsIHRyYWluaW5nLCBzZWVkKSAlPiUKICAgIG11dGF0ZShwcmV2X3N1cnAgPSBsYWcoc3VycHJpc2FsKSwKICAgICAgICAgcHJldl9jb2RlID0gbGFnKGNvZGUpLAogICAgICAgICBwcmV2X2xlbiA9IGxhZyhsZW4pLAogICAgICAgICBwcmV2X2ZyZXEgPSBsYWcoZnJlcSksCiAgICAgICAgIHByZXZfc3VycCA9IGxhZyhzdXJwcmlzYWwpLAogICAgICAgICAKICAgICAgICAgcHJldjJfZnJlcSA9IGxhZyhwcmV2X2ZyZXEpLAogICAgICAgICBwcmV2Ml9jb2RlID0gbGFnKHByZXZfY29kZSksCiAgICAgICAgIHByZXYyX2xlbiA9IGxhZyhwcmV2X2xlbiksCiAgICAgICAgIHByZXYyX3N1cnAgPSBsYWcocHJldl9zdXJwKSwKICAgICAgICAgCiAgICAgICAgIHByZXYzX2ZyZXEgPSBsYWcocHJldjJfZnJlcSksCiAgICAgICAgIHByZXYzX2NvZGUgPSBsYWcocHJldjJfY29kZSksCiAgICAgICAgIHByZXYzX2xlbiA9IGxhZyhwcmV2Ml9sZW4pLAogICAgICAgICBwcmV2M19zdXJwID0gbGFnKHByZXYyX3N1cnApKSAlPiUKICB1bmdyb3VwKCkgJT4lCiAgIyBGaWx0ZXIgYmFjayB0aHJlZSBmb3IgdGhlIGR1bmRlZSBjb3JwdXMuIEZpbHRlciBiYWNrIDEgZm9yIGFsbCBvdGhlciBjb3Jwb3JhCiAgZmlsdGVyKChjb3JwdXMgPT0gImR1bmRlZSIgJiBjb2RlID09IHByZXYyX2NvZGUgKyAyKSB8IChjb3JwdXMgIT0gImR1bmRlZSIgJiBjb2RlID09IHByZXZfY29kZSArIDEpKSAlPiUKICBzZWxlY3QoLXByZXZfY29kZSwgLXByZXYyX2NvZGUsIC1wcmV2M19jb2RlKSAlPiUKICBkcm9wX25hKCkKCmFsbF9kYXRhID0gYWxsX2RhdGEgJT4lCiAgbXV0YXRlKAogICAgbW9kZWwgPSBhcy5jaGFyYWN0ZXIobW9kZWwpLAogICAgbW9kZWwgPSBpZl9lbHNlKG1vZGVsID09ICJncHQtMiIsICJncHQyIiwgbW9kZWwpLAogICAgbW9kZWwgPSBhcy5mYWN0b3IobW9kZWwpKQpgYGAKCgogCmBgYHtyfQojIENvbXB1dGUgbGluZWFyIG1vZGVsIHN0YXRzIGZvciB0aGUgZ2l2ZW4gdHJhaW5pbmcgZGF0YSBzdWJzZXQgYW5kIGZ1bGwgdGVzdCBkYXRhLgojIEF1dG9tYXRpY2FsbHkgc3Vic2V0cyB0aGUgdGVzdCBkYXRhIHRvIG1hdGNoIHRoZSByZWxldmFudCBncm91cCBmb3Igd2hpY2ggd2UgYXJlIHRyYWluaW5nIGEgbGluZWFyIG1vZGVsLgpnZXRfbG1fZGF0YSA8LSBmdW5jdGlvbihkZiwgdGVzdF9kYXRhLCBmb3JtdWxhLCBmb2xkLCBzdG9yZV9lbnYpIHsKICAjdGhpc19sbSA8LSBnYW0oZm9ybXVsYSwgZGF0YT1kZik7CiAgdGhpc19sbSA9IGxtKGZvcm11bGEsIGRh
dGE9ZGYpCiAgdGhpc190ZXN0X2RhdGEgPC0gc2VtaV9qb2luKHRlc3RfZGF0YSwgZGYsIGJ5PWMoInRyYWluaW5nIiwgIm1vZGVsIiwgInNlZWQiLCAiY29ycHVzIikpOwogIAogICMgU2F2ZSBsbSB0byB0aGUgZ2xvYmFsIGVudiBzbyB0aGF0IHdlIGNhbiBhY2Nlc3MgcmVzaWR1YWxzIGxhdGVyLgogIGxtX25hbWUgPSBwYXN0ZSh1bmlxdWUocGFzdGUoZGYkbW9kZWwsIGRmJHRyYWluaW5nLCBkZiRzZWVkLCBkZiRjb3JwdXMpKVsxXSwgZm9sZCkKICBhc3NpZ24obG1fbmFtZSwgdGhpc19sbSwgZW52aXI9c3RvcmVfZW52KQogIAogIHN1bW1hcmlzZShkZiwKICAgICAgICAgICAgbG9nX2xpayA9IGFzLm51bWVyaWMobG9nTGlrKHRoaXNfbG0sIFJFTUwgPSBGKSksCiAgICAgICAgICAgIHRlc3RfbGlrID0gbG9nTGlrX3Rlc3QodGhpc19sbSwgdGhpc190ZXN0X2RhdGEsIHRoaXNfdGVzdF9kYXRhJHBzeWNob21ldHJpYyksCiAgICAgICAgICAgIHRlc3RfbXNlID0gbXNlX3Rlc3QodGhpc19sbSwgdGhpc190ZXN0X2RhdGEsIHRoaXNfdGVzdF9kYXRhJHBzeWNob21ldHJpYykpCn0KIyBGb3IgYSBwcmV2aW91c2x5IGZpdHRlZCBsbSBzdG9yZWQgaW4gc3RvcmVfZW52LCBnZXQgdGhlIHJlc2lkdWFscyBvbiB0ZXN0IGRhdGEgb2YgdGhlIHJlbGV2YW50IGRhdGEgc3Vic2V0LgpnZXRfbG1fcmVzaWR1YWxzIDwtIGZ1bmN0aW9uKGRmLCBmb2xkLCBzdG9yZV9lbnYpIHsKICAjIFJldHJpZXZlIHRoZSByZWxldmFudCBsbS4KICBsbV9uYW1lID0gcGFzdGUodW5pcXVlKHBhc3RlKGRmJG1vZGVsLCBkZiR0cmFpbmluZywgZGYkc2VlZCwgZGYkY29ycHVzKSlbMV0sIGZvbGQpCiAgdGhpc19sbSA8LSBnZXQobG1fbmFtZSwgZW52aXI9c3RvcmVfZW52KQogIAogIG11dGF0ZShkZiwKICAgICAgICAgbGlrZWxpaG9vZCA9IGxvZ0xpa190ZXN0X3Blcih0aGlzX2xtLCBkZiwgZGYkcHN5Y2hvbWV0cmljKSwKICAgICAgICAgcmVzaWQgPSBkZiRwc3ljaG9tZXRyaWMgLSBwcmVkaWN0KHRoaXNfbG0sIGRmLCByZS5mb3JtPU5BKSkKfQojIENvbXB1dGUgcGVyLWV4YW1wbGUgZGVsdGEtbG9nLWxpa2VsaWhvb2QgZm9yIHRoZSBnaXZlbiB0ZXN0IGZvbGQuCmdldF9sbV9kZWx0YV9sb2dfbGlrIDwtIGZ1bmN0aW9uKHRlc3RfZGF0YSwgZm9sZCwgYmFzZWxpbmVfZW52LCBmdWxsX2VudikgewogIGxtX25hbWUgPSBwYXN0ZSh1bmlxdWUocGFzdGUodGVzdF9kYXRhJG1vZGVsLCB0ZXN0X2RhdGEkdHJhaW5pbmcsIHRlc3RfZGF0YSRzZWVkLCB0ZXN0X2RhdGEkY29ycHVzKSlbMV0sIGZvbGQpCiAgYmFzZWxpbmVfbG0gPC0gZ2V0KGxtX25hbWUsIGVudmlyPWJhc2VsaW5lX2VudikKICBmdWxsX2xtIDwtIGdldChsbV9uYW1lLCBlbnZpcj1mdWxsX2VudikKICAKICBkZWx0YV9sb2dfbGlrID0gbG9nTGlrX3Rlc3RfcGVyKGZ1bGxfbG0sIHRlc3RfZGF0YSwgdGVzdF9kYXRhJHBzeWNob21ldHJpYykgLSBsb2dMaWtfdGVzdF9wZXIoYmFzZWxpbmVfbG0sIHRlc3Rf
ZGF0YSwgdGVzdF9kYXRhJHBzeWNob21ldHJpYykKICByZXR1cm4oY2JpbmQodGVzdF9kYXRhLCBkZWx0YV9sb2dfbGlrPWRlbHRhX2xvZ19saWspKQp9CiMjIyMjCiMgRGVmaW5lIHJlZ3Jlc3Npb24gZm9ybXVsYWUuCiMgRXllLXRyYWNraW5nIHJlZ3Jlc3Npb246IG9ubHkgdXNlIHN1cnByaXNhbCBhbmQgcHJldmlvdXMgc3VycHJpc2FsOyBTUFJUIHJlZ3Jlc3Npb246IHVzZSAyLWJhY2sgZmVhdHVyZXMuCiNiYXNlbGluZV9ydF9yZWdyZXNzaW9uID0gcHN5Y2hvbWV0cmljIH4gdGUoZnJlcSwgbGVuLCBicyA9ICJjciIpICsgdGUocHJldl9mcmVxLCBwcmV2X2xlbiwgYnMgPSAiY3IiKQojYmFzZWxpZV9zcHJ0X3JlZ3Jlc3Npb24gPSBwc3ljaG9tZXRyaWMgfiB0ZShmcmVxLCBsZW4sIGJzID0gImNyIikgKyB0ZShwcmV2X2ZyZXEsIHByZXZfbGVuLCBicyA9ICJjciIpICsgdGUocHJldjJfZnJlcSwgcHJldjJfbGVuLCBicyA9ICJjciIpCiNmdWxsX3J0X3JlZ3Jlc3Npb24gPSAocHN5Y2hvbWV0cmljIH4gcyhzdXJwcmlzYWwsIGJzID0gImNyIiwgayA9IDIwKSArIHMocHJldl9zdXJwLCBicyA9ICJjciIsIGsgPSAyMCkKICAgICAgICAgICAgICAgICAgICAgIysgdGUoZnJlcSwgbGVuLCBicyA9ICJjciIpICsgdGUocHJldl9mcmVxLCBwcmV2X2xlbiwgYnMgPSAiY3IiKSkKI2Z1bGxfc3BydF9yZWdyZXNzaW9uID0gKHBzeWNob21ldHJpYyB+IHMoc3VycHJpc2FsLCBicyA9ICJjciIsIGsgPSAyMCkgKyBzKHByZXZfc3VycCwgYnMgPSAiY3IiLCBrID0gMjApICsgcyhwcmV2Ml9zdXJwLCBicyA9ICJjciIsIGsgPSAyMCkKICAgICAgICAgICAgICAgICAgICAgICAgIysgdGUoZnJlcSwgbGVuLCBicyA9ICJjciIpICsgdGUocHJldl9mcmVxLCBwcmV2X2xlbiwgYnMgPSAiY3IiKSArIHRlKHByZXYyX2ZyZXEsIHByZXYyX2xlbiwgYnMgPSAiY3IiKSkKCmJhc2VsaW5lX3J0X3JlZ3Jlc3Npb24gPSBwc3ljaG9tZXRyaWMgfiBmcmVxICsgcHJldl9mcmVxICsgcHJldjJfZnJlcSArIHByZXYzX2ZyZXEgKyBsZW4gKyBwcmV2X2xlbiArIHByZXYyX2xlbiArIHByZXYzX2xlbgpiYXNlbGluZV9zcHJ0X3JlZ3Jlc3Npb24gPSBwc3ljaG9tZXRyaWMgfiBmcmVxICsgcHJldl9mcmVxICsgbGVuICsgcHJldl9sZW4KCmZ1bGxfcnRfcmVncmVzc2lvbiA9IHBzeWNob21ldHJpYyB+IHN1cnByaXNhbCArIHByZXZfc3VycCArIHByZXYyX3N1cnAgKyBwcmV2M19zdXJwICsgZnJlcSArIHByZXZfZnJlcSArIHByZXYyX2ZyZXEgKyBwcmV2M19mcmVxICsgbGVuICsgcHJldl9sZW4gKyBwcmV2Ml9sZW4gKyBwcmV2M19sZW4KZnVsbF9zcHJ0X3JlZ3Jlc3Npb24gPSBwc3ljaG9tZXRyaWMgfiBzdXJwcmlzYWwgKyBwcmV2X3N1cnAgKyBmcmVxICsgcHJldl9mcmVxICsgbGVuICsgcHJldl9sZW4KICAKIyMjIyMKIyBQcmVwYXJlIGZyYW1lcy9lbnZpcm9ubWVudHMgZm9yIHN0b3JpbmcgcmVzdWx0cy9vYmplY3RzLgpiYXNlbGluZV9yZXN1bHRzID0gZGF0YS5m
cmFtZSgpCmZ1bGxfbW9kZWxfcmVzdWx0cyA9IGRhdGEuZnJhbWUoKQojYmFzZWxpbmVfcmVzaWR1YWxzID0gZGF0YS5mcmFtZSgpCiNmdWxsX3Jlc2lkdWFscyA9IGRhdGEuZnJhbWUoKQpsb2dfbGlrX2RlbHRhcyA9IGRhdGEuZnJhbWUoKQoKI1JhbmRvbWx5IHNodWZmbGUgdGhlIGRhdGEKYWxsX2RhdGE8LWFsbF9kYXRhW3NhbXBsZShucm93KGFsbF9kYXRhKSksXQojQ3JlYXRlIEsgZXF1YWxseSBzaXplIGZvbGRzCksgPSA1CmZvbGRzIDwtIGN1dChzZXEoMSxucm93KGFsbF9kYXRhKSksYnJlYWtzPUssbGFiZWxzPUZBTFNFKQojUGVyZm9ybSAxMCBmb2xkIGNyb3NzIHZhbGlkYXRpb24KCiMgRml0IG1vZGVscyBmb3Igc29tZSBmb2xkIG9mIHRoZSBkYXRhLgpiYXNlbGluZV9jb3JwdXMgPSBmdW5jdGlvbihjb3JwdXMsIGRmLCB0ZXN0X2RhdGEsIGZvbGQsIGVudikgewogIGlmKGNvcnB1cyA9PSAiZHVuZGVlIikgewogICAgZ2V0X2xtX2RhdGEoZGYsIHRlc3RfZGF0YSwgYmFzZWxpbmVfcnRfcmVncmVzc2lvbiwgZm9sZCwgZW52KQogIH0gZWxzZSB7CiAgICBnZXRfbG1fZGF0YShkZiwgdGVzdF9kYXRhLCBiYXNlbGluZV9zcHJ0X3JlZ3Jlc3Npb24sIGZvbGQsIGVudikKICB9Cn0KZnVsbF9tb2RlbF9jb3JwdXMgPSBmdW5jdGlvbihjb3JwdXMsIGRmLCB0ZXN0X2RhdGEsIGZvbGQsIGVudikgewogIGlmKGNvcnB1c1sxXSA9PSAiZHVuZGVlIikgewogICAgZ2V0X2xtX2RhdGEoZGYsIHRlc3RfZGF0YSwgZnVsbF9ydF9yZWdyZXNzaW9uLCBmb2xkLCBlbnYpCiAgfSBlbHNlIHsKICAgIGdldF9sbV9kYXRhKGRmLCB0ZXN0X2RhdGEsIGZ1bGxfc3BydF9yZWdyZXNzaW9uLCBmb2xkLCBlbnYpCiAgfQp9CgojIFByZXBhcmUgYSBuZXcgRW52aXJvbm1lbnQgaW4gd2hpY2ggd2Ugc3RvcmUgZml0dGVkIExNcywgd2hpY2ggd2UnbGwgcXVlcnkgbGF0ZXIgZm9yIHJlc2lkdWFscyBhbmQgb3RoZXIgbWV0cmljcy4KYmFzZWxpbmVfZW52ID0gbmV3LmVudigpCmZ1bGxfZW52ID0gbmV3LmVudigpCgpmb3IoaSBpbiAxOkspIHsgCiAgI1NlZ2VtZW50IHlvdXIgZGF0YSBieSBmb2xkIHVzaW5nIHRoZSB3aGljaCgpIGZ1bmN0aW9uIAogIHRlc3RJbmRleGVzIDwtIHdoaWNoKGZvbGRzPT1pLCBhcnIuaW5kPVRSVUUpCiAgdGVzdF9kYXRhIDwtIGFsbF9kYXRhW3Rlc3RJbmRleGVzLCBdCiAgdHJhaW5fZGF0YSA8LSBhbGxfZGF0YVstdGVzdEluZGV4ZXMsIF0KICAKICAjIENvbXB1dGUgYSBiYXNlbGluZSBsaW5lYXIgbW9kZWwgZm9yIGVhY2ggbW9kZWwtLXRyYWluaW5nLS1zZWVkLS1SVC1jb3JwdXMgY29tYmluYXRpb24uCiAgYmFzZWxpbmVzID0gdHJhaW5fZGF0YSAlPiUKICAgIGdyb3VwX2J5KG1vZGVsLCB0cmFpbmluZywgc2VlZCwgY29ycHVzKSAlPiUKICAgICAgcHJpbnQobW9kZWwpICU+JQogICAgICBkbyhiYXNlbGluZV9jb3JwdXModW5pcXVlKC4kY29ycHVzKSwgLiwgdGVzdF9kYXRhLCBpLCBiYXNlbGluZV9lbnYpKSAlPiUKICAgIHVu
Z3JvdXAoKSAlPiUKICAgIG11dGF0ZShzZWVkID0gYXMuZmFjdG9yKHNlZWQpLAogICAgICAgICAgIGZvbGQgPSBpKQogIAogIGJhc2VsaW5lX3Jlc3VsdHMgPSByYmluZChiYXNlbGluZV9yZXN1bHRzLCBiYXNlbGluZXMpCiAgCiAgIyBDb21wdXRlIGEgZnVsbCBsaW5lYXIgbW9kZWwgZm9yIGVhY2ggbW9kZWwtLXRyYWluaW5nLS1zZWVkLVJULWNvcnB1cyBjb21iaW5hdGlvbgogIGZ1bGxfbW9kZWxzID0gdHJhaW5fZGF0YSAlPiUKICAgIGdyb3VwX2J5KG1vZGVsLCB0cmFpbmluZywgc2VlZCwgY29ycHVzKSAlPiUKICAgICAgZG8oZnVsbF9tb2RlbF9jb3JwdXModW5pcXVlKC4kY29ycHVzKSwgLiwgdGVzdF9kYXRhLCBpLCBmdWxsX2VudikpICU+JQogICAgdW5ncm91cCgpICU+JQogICAgbXV0YXRlKHNlZWQgPSBhcy5mYWN0b3Ioc2VlZCksCiAgICAgICAgICAgZm9sZCA9IGkpCiAgCiAgZnVsbF9tb2RlbF9yZXN1bHRzID0gcmJpbmQoZnVsbF9tb2RlbF9yZXN1bHRzLCBmdWxsX21vZGVscykKICAKICAjIENvbXB1dGUgZGVsdGEtbG9nLWxpa2VsaWhvb2RzCiAgZm9sZF9sb2dfbGlrX2RlbHRhcyA9IHRlc3RfZGF0YSAlPiUKICAgIGdyb3VwX2J5KG1vZGVsLCB0cmFpbmluZywgc2VlZCwgY29ycHVzKSAlPiUKICAgICAgZG8oZ2V0X2xtX2RlbHRhX2xvZ19saWsoLiwgaSwgYmFzZWxpbmVfZW52LCBmdWxsX2VudikpICU+JQogICAgdW5ncm91cCgpCgogIGxvZ19saWtfZGVsdGFzID0gcmJpbmQobG9nX2xpa19kZWx0YXMsIGZvbGRfbG9nX2xpa19kZWx0YXMpCiAgCiAgIyBmb2xkX2Jhc2VsaW5lX3Jlc2lkdWFscyA9IHRlc3RfZGF0YSAlPiUKICAjICAgZ3JvdXBfYnkobW9kZWwsIHRyYWluaW5nLCBzZWVkLCBjb3JwdXMpICU+JQogICMgICAgIGRvKGdldF9sbV9yZXNpZHVhbHMoLiwgaSwgYmFzZWxpbmVfZW52KSkgJT4lCiAgIyAgIHVuZ3JvdXAoKQogICMgCiAgIyBiYXNlbGluZV9yZXNpZHVhbHMgPSByYmluZChiYXNlbGluZV9yZXNpZHVhbHMsIGZvbGRfYmFzZWxpbmVfcmVzaWR1YWxzKQogICMgCiAgIyBmb2xkX2Z1bGxfcmVzaWR1YWxzID0gdGVzdF9kYXRhICU+JQogICMgICBncm91cF9ieShtb2RlbCwgdHJhaW5pbmcsIHNlZWQsIGNvcnB1cykgJT4lCiAgIyAgICAgZG8oZ2V0X2xtX3Jlc2lkdWFscyguLCBpLCBmdWxsX2VudikpICU+JQogICMgICB1bmdyb3VwKCkgCiAgIyAKICAjIGZ1bGxfcmVzaWR1YWxzID0gcmJpbmQoZnVsbF9yZXNpZHVhbHMsIGZvbGRfZnVsbF9yZXNpZHVhbHMpCn0KYGBgCgpgYGB7cn0KI3dyaXRlLmNzdihmdWxsX3Jlc2lkdWFscywgIi4uL2RhdGEvYW5hbHlzaXNfY2hlY2twb2ludHMvZnVsbF9yZXNpZHVhbHMuY3N2IikKI3dyaXRlLmNzdihiYXNlbGluZV9yZXNpZHVhbHMsICIuLi9kYXRhL2FuYWx5c2lzX2NoZWNrcG9pbnRzL2Jhc2VsaW5lX3Jlc2lkdWFscy5jc3YiKQpgYGAKCmBgYHtyfQptb2RlbF9kZWx0YXMgPSBsb2dfbGlrX2RlbHRhcyAlPiUKICBncm91cF9ieShtb2RlbCwgdHJhaW5p
bmcsIHNlZWQsIGNvcnB1cykgJT4lIAogIHN1bW1hcmlzZShtZWFuX2RlbHRhX2xvZ19saWsgPSBtZWFuKGRlbHRhX2xvZ19saWspLAogICAgICAgICAgICBzZW1fZGVsdGFfbG9nX2xpayA9IHNkKGRlbHRhX2xvZ19saWspIC8gc3FydChsZW5ndGgoZGVsdGFfbG9nX2xpaykpKQpgYGAKCmBgYHtyfQp3cml0ZS5jc3YoZnVsbF9tb2RlbF9yZXN1bHRzLCAiLi4vZGF0YS9hbmFseXNpc19jaGVja3BvaW50cy9mdWxsX21vZGVsX3Jlc3VsdC5jc3YiKQp3cml0ZS5jc3YoYmFzZWxpbmVfcmVzdWx0cywgIi4uL2RhdGEvYW5hbHlzaXNfY2hlY2twb2ludHMvYmFzZWxpbmVfcmVzdWx0cy5jc3YiKQojZnVsbF9tb2RlbF9yZXN1bHRzID0gcmVhZC5jc3YoIi4uL2RhdGEvYW5hbHlzaXNfY2hlY2twb2ludHMvZmZ1bGxfbW9kZWxfcmVzdWx0cy5jc3YiKQojYmFzZWxpbmVfcmVzdWx0cyA9IHJlYWQuY3N2KCIuLi9kYXRhL2FuYWx5c2lzX2NoZWNrcG9pbnRzL2ZiYXNlbGluZV9yZXN1bHRzYi5jc3YiKQpgYGAKCmBgYHtyfQptZXRyaWMgPC0gIs6UTG9nTGlrIgojbWV0cmljIDwtICItzpRNU0UiCgojICMgU2VsZWN0IHRoZSByZWxldmFudCBtZXRyaWMuCm1vZGVsX2RlbHRhcyA9IG1vZGVsX2RlbHRhcyAlPiUKICAgICMgUmV0cmlldmUgdGhlIGN1cnJlbnQgdGVzdCBtZXRyaWMKICAgIG11dGF0ZShkZWx0YV90ZXN0X21lYW4gPSBtZWFuX2RlbHRhX2xvZ19saWssCiAgICAgICAgICAgZGVsdGFfdGVzdF9zZW0gPSBzZW1fZGVsdGFfbG9nX2xpaykgJT4lCiAgICAjIG11dGF0ZShkZWx0YV90ZXN0X21lYW4gPSBtZWFuX2RlbHRhX21zZSwKICAgICMgICAgICAgIGRlbHRhX3Rlc3Rfc2VtID0gc2VtX2RlbHRhX21zZSkKICAgIAogICAgIyBSZW1vdmUgdGhlIHJhdyBtZXRyaWNzLgogICAgc2VsZWN0KC1tZWFuX2RlbHRhX2xvZ19saWssIC1zZW1fZGVsdGFfbG9nX2xpaywKICAgICAgICAgICAjLW1lYW5fZGVsdGFfbXNlLCAtc2VtX2RlbHRhX21zZQogICAgICAgICAgICkKbW9kZWxfZGVsdGFzCmBgYAoKYGBge3J9CiMgU2FuaXR5IGNoZWNrOiB0cmFpbmluZyBvbiB0cmFpbit0ZXN0IGRhdGEgc2hvdWxkIHlpZWxkIGltcHJvdmVkIHBlcmZvcm1hbmNlIG92ZXIgdHJhaW5pbmcgb24ganVzdCB0cmFpbmluZyBkYXRhLiAoV2hlbiBldmFsdWF0aW5nIG9uIHRlc3QgZGF0YS4pCiMgZnVsbF9iYXNlbGluZXMgPSBhbGxfZGF0YSAlPiUKIyAgIGdyb3VwX2J5KG1vZGVsLCB0cmFpbmluZywgc2VlZCwgY29ycHVzKSAlPiUKIyAgIHN1bW1hcmlzZShiYXNlbGluZV90cmFpbl9hbGxfdGVzdF9saWsgPSBsb2dMaWtfdGVzdChsbShwc3ljaG9tZXRyaWMgfiBsZW4gKyBmcmVxICsgc2VudF9wb3MsIGRhdGE9LiksIHNlbWlfam9pbih0ZXN0X2RhdGEsIC4sIGJ5PWMoInRyYWluaW5nIiwgIm1vZGVsIiwgInNlZWQiLCAiY29ycHVzIikpLCBzZW1pX2pvaW4odGVzdF9kYXRhLCAuLCBieT1jKCJ0cmFpbmluZyIsICJtb2RlbCIsICJzZWVkIiwgImNvcnB1cyIpKSRwc3lj
aG9tZXRyaWMpKSAlPiUKIyAgIHVuZ3JvdXAoKQojIGZ1bGxfYmFzZWxpbmVzCiMgCiMgZnVsbF9iYXNlbGluZXMgJT4lCiMgICByaWdodF9qb2luKGJhc2VsaW5lcywgYnk9Yygic2VlZCIsICJ0cmFpbmluZyIsICJtb2RlbCIsICJjb3JwdXMiKSkgJT4lCiMgICBtdXRhdGUoZGVsdGE9YmFzZWxpbmVfdHJhaW5fYWxsX3Rlc3RfbGlrLWJhc2VsaW5lX3Rlc3RfbGlrKSAlPiUKIyAgIHNlbGVjdCgtYmFzZWxpbmVfbGlrKSAjICU+JQojICAgI3NlbGVjdCgtYmFzZWxpbmVfdGVzdF9saWssIC1iYXNlbGluZV90cmFpbl9hbGxfdGVzdF9saWssIC1iYXNlbGluZV9saWssIC1iYXNlbGluZV90ZXN0X21zZSkKYGBgCgojIExvYWQgbGFuZ3VhZ2UgbW9kZWwgZGF0YSAoU3ludGF4R3ltLCBQUEwpCgpgYGB7cn0KbGFuZ3VhZ2VfbW9kZWxfZGF0YSA9IHJlYWQuY3N2KCIuLi9kYXRhL21vZGVsX21ldGFkYXRhLmNzdiIpICU+JQogIG11dGF0ZShtb2RlbCA9IGFzLmNoYXJhY3Rlcihtb2RlbCksCiAgICAgICAgIG1vZGVsID0gaWZfZWxzZShtb2RlbCA9PSAiZ3B0LTIiLCAiZ3B0MiIsIG1vZGVsKSwKICAgICAgICAgbW9kZWwgPSBhcy5mYWN0b3IobW9kZWwpKSAlPiUKICBtdXRhdGUodHJhaW5fc2l6ZSA9IGNhc2Vfd2hlbihzdHJfc3RhcnRzKHRyYWluaW5nLCAiYmxsaXAtbGciKSB+IDQyLAogICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgIHN0cl9zdGFydHModHJhaW5pbmcsICJibGxpcC1tZCIpIH4gMTUsCiAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgc3RyX3N0YXJ0cyh0cmFpbmluZywgImJsbGlwLXNtIikgfiA1LAogICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgIHN0cl9zdGFydHModHJhaW5pbmcsICJibGxpcC14cyIpIH4gMSksCiAgICAgICAgIAogICAgICAgICAjIFRyYWluaW5nIHZvY2FidWxhcnkgdXN1YWxseSBjb3ZhcmllcyB3aXRoIHRoZSB0cmFpbmluZyBjb3JwdXMuCiAgICAgICAgICMgQnV0IEJQRSBtb2RlbHMgc2hhcmUgYSB2b2NhYnVsYXJ5IGFjcm9zcyB0cmFpbmluZyBjb3Jwb3JhLgogICAgICAgICB0cmFpbmluZ192b2NhYj1hcy5mYWN0b3IoaWZlbHNlKHN0cl9kZXRlY3QodHJhaW5pbmcsICJncHRicGUiKSwgImdwdGJwZSIsIGFzLmNoYXJhY3Rlcih0cmFpbmluZykpKQogICAgICAgICApICU+JQogIG11dGF0ZShzZWVkID0gYXMuZmFjdG9yKHNlZWQpKSAlPiUKICBzZWxlY3QoLXBpZCwgLXRlc3RfbG9zcykgJT4lCiAgZGlzdGluY3QobW9kZWwsIHRyYWluaW5nLCBzZWVkLCAua2VlcF9hbGwgPSBUUlVFKQp0YWJsZShsYW5ndWFnZV9tb2RlbF9kYXRhJHNlZWQpCnRhYmxlKG1vZGVsX2RlbHRhcyRzZWVkKQpgYGAKCkZpcnN0IGpvaW4gZGVsdGEtbWV0cmljIGRhdGEgd2l0aCBtb2RlbCBhdXhpbGlhcnkgZGF0YS4KCmBgYHtyfQptb2RlbF9kZWx0YXMgPSBtb2RlbF9kZWx0YXMgJT4lCiAgbWVyZ2UobGFuZ3VhZ2VfbW9kZWxfZGF0YSwgYnkgPSBjKCJzZWVkIiwgInRyYWluaW5nIiwgIm1vZGVs
IiksIGFsbD1UKSAlPiUKICBkcm9wX25hKCkKCm1vZGVsX2RlbHRhcwpgYGAKCkFsc28gam9pbiBvbiB0aGUgb3JpZ2luYWwgbGluZWFyIG1vZGVsIGRhdGEsIHJhdGhlciB0aGFuIGNvbGxhcHNpbmcgdG8gZGVsdGEtbWV0cmljcy4KVGhpcyB3aWxsIHN1cHBvcnQgcmVncmVzc2lvbnMgbGF0ZXIgb24gdGhhdCBkb24ndCBjb2xsYXBzZSBhY3Jvc3MgZm9sZHMuCgoKIyBGaW5hbCBkYXRhIHByZXByb2Nlc3NpbmcKCmBgYHtyIEZpbHRlciBtb2RlbHMgYW5kL29yIGNvcnBvcmF9CiMgRXhjbHVkZSBvcmRlcmVkLW5ldXJvbnMgZnJvbSBhbGwgYW5hbHlzZXMuCm1vZGVsX2RlbHRhcyA8LSBtb2RlbF9kZWx0YXMgJT4lCiAgZmlsdGVyKG1vZGVsICE9ICJvcmRlcmVkLW5ldXJvbnMiKQpgYGAKCgojIFZpc3VhbGl6YXRpb25zCgojIyBQcmVkaWN0aXZlIHBvd2VyIGFuZCBTRwoKCmBgYHtyIEJ5IG1vZGVsfQptb2RlbF9kZWx0YXMgJT4lCiAgZ2dwbG90KGFlcyh4PXNnX3Njb3JlLCB5PWRlbHRhX3Rlc3RfbWVhbikpICsKICAgIGdlb21fZXJyb3JiYXIoYWVzKHltaW49ZGVsdGFfdGVzdF9tZWFuLWRlbHRhX3Rlc3Rfc2VtLCB5bWF4PWRlbHRhX3Rlc3RfbWVhbitkZWx0YV90ZXN0X3NlbSkpICsKICAgIGdlb21fc21vb3RoKG1ldGhvZD0ibG0iLCBzZT1UKSArCiAgICBnZW9tX3BvaW50KHN0YXQ9ImlkZW50aXR5IiwgcG9zaXRpb249ImRvZGdlIiwgYWxwaGE9MSwgc2l6ZT0zLCBhZXMoY29sb3I9dHJhaW5pbmdfdm9jYWIsIHNoYXBlPW1vZGVsKSkgKwogICAgeWxhYihtZXRyaWMpICsKICAgIHhsYWIoIlN5bnRheCBHZW5lcmFsaXphdGlvbiBTY29yZSIpICsKICAgIGdndGl0bGUoIlN5bnRhY3RpYyBHZW5lcmFsaXphdGlvbiB2cy4gUHJlZGljdGl2ZSBQb3dlciIpICsKICAgIHNjYWxlX2NvbG9yX21hbnVhbCh2YWx1ZXMgPSBjKCJibGxpcC1sZyI9IiM0NDAxNTRGRiIsCiAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICJibGxpcC1tZCI9IiMzOTU2OENGRiIsCiAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICJibGxpcC1zbSI9IiMxRjk2OEJGRiIsCiAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICJibGxpcC14cyI9IiM3M0QwNTVGRiIsCiAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICJncHRicGUiPSIjODg4ODg4IikpICsKICAgIGZhY2V0X2dyaWQofmNvcnB1cywgc2NhbGVzPSJmcmVlIikgKwogICAgdGhlbWUoYXhpcy50ZXh0PWVsZW1lbnRfdGV4dChzaXplPTE0KSwKICAgICAgICAgIHN0cmlwLnRleHQueCA9IGVsZW1lbnRfdGV4dChzaXplPTE0KSwKICAgICAgICAgIGxlZ2VuZC50ZXh0PWVsZW1lbnRfdGV4dChzaXplPTE0KSwKICAgICAgICAgIGF4aXMudGl0bGU9ZWxlbWVudF90ZXh0KHNpemU9MTgpLAogICAgICAgICAgbGVnZW5kLnBvc2l0aW9uID0gImJvdHRvbSIpCiNnZ3NhdmUoIi4vY29nc2NpX2ltYWdlcy9zZ19sb2dsaWsucG5nIixoZWlnaHQ9NSx3aWR0aD02KQpgYGAKCiMjIyBSZWdyZXNzaW9uIGFu
YWx5c2VzCgpXZSBjb250cm9sIGZvciBlZmZlY3RzIG9mIHBlcnBsZXhpdHkgYnkgcmVsYXRpbmcgdGhlIHJlc2lkdWFscyBvZiBhIGBwZXJmb3JtYW5jZSB+IFBQTGAgcmVncmVzc2lvbiB0byBTRyBzY29yZS4KCmBgYHtyIFJlc2lkdWFsaXplZCByZWdyZXNzaW9ufQojIFByZXBhcmUgYSByZXNpZHVhbGl6ZWQgcmVncmVzc2lvbiBmb3IgeDEgb250byB5LCBjb250cm9sbGluZyBmb3IgdGhlIGVmZmVjdHMgb2YgeDIuCmRfcmVzaWQgPSBtb2RlbF9kZWx0YXMgJT4lCiAgZHJvcF9uYSgpICU+JQogIAogICMgUmVzaWR1YWxpemUgZGVsdGEgbWV0cmljIHcuci50IFBQTCBmb3IgZWFjaCBtb2RlbC0tdHJhaW5pbmctLXNlZWQKICBncm91cF9ieShjb3JwdXMpICU+JQogICAgbXV0YXRlKHJlc2lkLmRlbHRhID0gcmVzaWQobG0oZGVsdGFfdGVzdF9tZWFuIH4gdHJhaW5pbmc6dGVzdF9wcGwpKSkgJT4lCiAgdW5ncm91cCgpICU+JQogIAogICMgUmVzaWR1YWxpemUgU0cgc2NvcmUgdy5yLnQuIFBQTCBmb3IgZWFjaCB0cmFpbmluZyB2b2NhYnVsYXJ5CiAgZ3JvdXBfYnkodHJhaW5pbmdfdm9jYWIpICU+JQogICAgIyBOQiBubyBuZWVkIGZvciB0cmFpbmluZzpwcGwgaW50ZXJhY3Rpb24sIHNpbmNlIHdlJ3JlIHdpdGhpbi1ncm91cC4KICAgIG11dGF0ZShyZXNpZC5zZyA9IHJlc2lkKGxtKHNnX3Njb3JlIH4gdGVzdF9wcGwpKSkgJT4lCiAgdW5ncm91cCgpICU+JQogICMgQ29tcHV0ZSBzdW1tYXJ5IHN0YXRpc3RpY3MgYWNyb3NzIG1vZGVsLS10cmFpbmluZy0tc2VlZC0tY29ycHVzLgogIGdyb3VwX2J5KG1vZGVsLCB0cmFpbmluZ192b2NhYiwgY29ycHVzLCBzZWVkKSAlPiUKICAgIHN1bW1hcmlzZShyZXNpZC5kZWx0YS5tZWFuID0gbWVhbihyZXNpZC5kZWx0YSksCiAgICAgICAgICAgICAgcmVzaWQuZGVsdGEuc2VtID0gc2QocmVzaWQuZGVsdGEpIC8gc3FydChsZW5ndGgocmVzaWQuZGVsdGEpKSwKICAgICAgICAgICAgICByZXNpZC5zZy5tZWFuID0gbWVhbihyZXNpZC5zZyksCiAgICAgICAgICAgICAgcmVzaWQuc2cuc2VtID0gc2QocmVzaWQuc2cpIC8gc3FydChsZW5ndGgocmVzaWQuc2cpKSkKIyBOb3cgcGxvdCByZXNpZHVhbCB2cyBTRwpkX3Jlc2lkICU+JQogICNmaWx0ZXIoY29ycHVzICE9ICJibmMtYnJvd24iKSAlPiUKICBnZ3Bsb3QoYWVzKHg9cmVzaWQuc2cubWVhbiwgeT1yZXNpZC5kZWx0YS5tZWFuKSkgKwogICAgZ2VvbV9lcnJvcmJhcihhZXMoeG1pbj1yZXNpZC5zZy5tZWFuIC0gcmVzaWQuc2cuc2VtLAogICAgICAgICAgICAgICAgICAgICAgeG1heD1yZXNpZC5zZy5tZWFuICsgcmVzaWQuc2cuc2VtLAogICAgICAgICAgICAgICAgICAgICAgeW1pbj1yZXNpZC5kZWx0YS5tZWFuIC0gcmVzaWQuZGVsdGEuc2VtLAogICAgICAgICAgICAgICAgICAgICAgeW1heD1yZXNpZC5kZWx0YS5tZWFuICsgcmVzaWQuZGVsdGEuc2VtKSwgYWxwaGE9MC4zKSArCiAgICBnZW9tX3Ntb290aChtZXRob2Q9ImxtIiwgc2U9VCkgKwog
ICAgZ2VvbV9wb2ludChzdGF0PSJpZGVudGl0eSIsIHBvc2l0aW9uPSJkb2RnZSIsIGFscGhhPTEsIHNpemU9NCwgYWVzKHNoYXBlPW1vZGVsLCBjb2xvcj10cmFpbmluZ192b2NhYikpICsKICAgIHlsYWIocGFzdGUoIlJlc2lkdWFsIiwgbWV0cmljKSkgKwogICAgeGxhYigiUmVzaWR1YWwgU3ludGF4IEdlbmVyYWxpemF0aW9uIFNjb3JlIikgKwogICAgZ2d0aXRsZSgiU3ludGFjdGljIEdlbmVyYWxpemF0aW9uIHZzLiBQcmVkaWN0aXZlIFBvd2VyIikgKwogICAgc2NhbGVfY29sb3JfbWFudWFsKHZhbHVlcyA9IGMoImJsbGlwLWxnIj0iIzQ0MDE1NEZGIiwKICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICJibGxpcC1tZCI9IiMzOTU2OENGRiIsCiAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAiYmxsaXAtc20iPSIjMUY5NjhCRkYiLAogICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgImJsbGlwLXhzIj0iIzczRDA1NUZGIiwKICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICJncHRicGUiPSIjODg4ODg4IikpICsKICAgIGZhY2V0X2dyaWQoLn5jb3JwdXMsIHNjYWxlcz0iZnJlZSIpICsKICAgIHRoZW1lKGF4aXMudGV4dD1lbGVtZW50X3RleHQoc2l6ZT0xNCksCiAgICAgICAgICBzdHJpcC50ZXh0LnggPSBlbGVtZW50X3RleHQoc2l6ZT0xNCksCiAgICAgICAgICBsZWdlbmQudGV4dD1lbGVtZW50X3RleHQoc2l6ZT0xNCksCiAgICAgICAgICBheGlzLnRpdGxlPWVsZW1lbnRfdGV4dChzaXplPTE4KSwKICAgICAgICAgIGxlZ2VuZC5wb3NpdGlvbiA9ICJyaWdodCIpCmdnc2F2ZSgiLi4vaW1hZ2VzL2N1bnkyMDIwL3BwbF9zZy5wbmciLGhlaWdodD00LjUsd2lkdGg9MTEpCmBgYAoKCmBgYHtyIFN0ZXB3aXNlIHJlZ3Jlc3Npb259CmRvX3N0ZXB3aXNlX3JlZ3Jlc3Npb24gPSBmdW5jdGlvbihjdXJfY29ycHVzKSB7CiAgcmVncmVzc2lvbl9kYXRhID0gbW9kZWxfZGVsdGFzICU+JQogICAgZmlsdGVyKGNvcnB1cyA9PSBjdXJfY29ycHVzKQogIAogIHByaW50KCItLS0tLS0tLS0tLS0tLS0tLS0tLS0tIikKICBwcmludChjdXJfY29ycHVzKQogIAogIGxtMSA9IGxtKGRlbHRhX3Rlc3RfbWVhbiB+IHRyYWluaW5nX3ZvY2FiOnRlc3RfcHBsLCBkYXRhID0gcmVncmVzc2lvbl9kYXRhKQogIGxtMiA9IGxtKGRlbHRhX3Rlc3RfbWVhbiB+IHRyYWluaW5nX3ZvY2FiOnRlc3RfcHBsICsgc2dfc2NvcmUsIGRhdGEgPSByZWdyZXNzaW9uX2RhdGEpCiAgcHJpbnQoYW5vdmEobG0xLCBsbTIpKQogIHN1bW1hcnkobG0yKQp9CiNkb19zdGVwd2lzZV9yZWdyZXNzaW9uKCJibmMtYnJvd24iKQpkb19zdGVwd2lzZV9yZWdyZXNzaW9uKCJkdW5kZWUiKQpkb19zdGVwd2lzZV9yZWdyZXNzaW9uKCJuYXR1cmFsLXN0b3JpZXMiKQpgYGAKCiMjIFByZWRpY3RpdmUgcG93ZXIgYW5kIHBlcnBsZXhpdHkKCmBgYHtyfQptb2RlbF9kZWx0YXMgJT4lCiAgZ2dwbG90KGFlcyh4PXRlc3RfcHBsLCB5PWRlbHRhX3Rl
c3RfbWVhbiwgY29sb3I9dHJhaW5pbmdfdm9jYWIpKSArCiAgICBnZW9tX2Vycm9yYmFyKGFlcyh5bWluPWRlbHRhX3Rlc3RfbWVhbi1kZWx0YV90ZXN0X3NlbSwgeW1heD1kZWx0YV90ZXN0X21lYW4rZGVsdGFfdGVzdF9zZW0pLCBhbHBoYT0wLjQpICsKICAgICNnZW9tX3Ntb290aChtZXRob2Q9ImxtIiwgc2U9RikgKwogICAgZ2VvbV9wb2ludChzdGF0PSJpZGVudGl0eSIsIHBvc2l0aW9uPSJkb2RnZSIsIGFscGhhPTEsIHNpemU9NCwgYWVzKHNoYXBlPW1vZGVsKSkgKwogICAgeWxhYihtZXRyaWMpICsKICAgIHhsYWIoIlRlc3QgUGVycGxleGl0eSIpICsKICAgICNjb29yZF9jYXJ0ZXNpYW4oeWxpbSA9IGMoMSwgMTYpKSArCiAgICBnZ3RpdGxlKCJUZXN0IFBlcnBsZXhpdHkgdnMuIFByZWRpY3RpdmUgUG93ZXIiKSArCiAgICBzY2FsZV9jb2xvcl9tYW51YWwodmFsdWVzID0gYygiYmxsaXAtbGciPSIjNDQwMTU0RkYiLAogICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgImJsbGlwLW1kIj0iIzM5NTY4Q0ZGIiwKICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICJibGxpcC1zbSI9IiMxRjk2OEJGRiIsCiAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAiYmxsaXAteHMiPSIjNzNEMDU1RkYiLAogICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgImdwdGJwZSI9IiM4ODg4ODgiKSkgKwogICAgZmFjZXRfZ3JpZCh+Y29ycHVzLCBzY2FsZXM9ImZyZWUiKSArCiAgICAjY29vcmRfY2FydGVzaWFuKHlsaW0gPSBjKDAsIDE1MCkpICsKICAgIHRoZW1lKGF4aXMudGV4dD1lbGVtZW50X3RleHQoc2l6ZT0xMiksCiAgICAgICAgICBzdHJpcC50ZXh0LnggPSBlbGVtZW50X3RleHQoc2l6ZT0xMiksCiAgICAgICAgICBsZWdlbmQudGV4dD1lbGVtZW50X3RleHQoc2l6ZT0xMiksCiAgICAgICAgICBheGlzLnRpdGxlPWVsZW1lbnRfdGV4dChzaXplPTEyKSwKICAgICAgICAgIGxlZ2VuZC5wb3NpdGlvbiA9ICJyaWdodCIpCmdnc2F2ZSgiLi4vaW1hZ2VzL2N1bnkyMDIwL3BwbF9sb2dsaWsucG5nIixoZWlnaHQ9NC41LHdpZHRoPTExKQoKYGBgCgpgYGB7cn0KbW9kZWxfZGVsdGFzICU+JQogICNmaWx0ZXIobW9kZWwgIT0gIjVncmFtIiwgdHJhaW5pbmcgIT0gImJsbGlwLWxnIikgJT4lCiAgZ3JvdXBfYnkobW9kZWwsIGNvcnB1cykgJT4lCiAgICAjc3VtbWFyaXNlKG4gPSBuKCkpCiAgICBzdW1tYXJpc2UoY29yciA9IGFzLm51bWVyaWMoY29yLnRlc3QoZGVsdGFfdGVzdF9tZWFuLCB0ZXN0X3BwbClbNF0pLAogICAgICAgICAgICAgIHB2YWwgPSBhcy5udW1lcmljKGNvci50ZXN0KGRlbHRhX3Rlc3RfbWVhbiwgdGVzdF9wcGwpWzNdKSkKYGBgCgoKIyMgRWZmZWN0IG9mIHRyYWluaW5nIGRhdGEgc2l6ZQoKYGBge3IgT24gcHJlZGljdGl2ZSBwb3dlcn0KbW9kZWxfZGVsdGFzICU+JQogIG11dGF0ZSh0cmFpbl9zaXplID0gbG9nKHRyYWluX3NpemUpKSAlPiUKICBnZ3Bsb3QoYWVzKHg9dHJhaW5fc2l6
ZSwgeT1kZWx0YV90ZXN0X21lYW4sIGNvbG9yPW1vZGVsKSkgKwogICAgZ2VvbV9lcnJvcmJhcihhZXMoeW1pbj1kZWx0YV90ZXN0X21lYW4tZGVsdGFfdGVzdF9zZW0sIHltYXg9ZGVsdGFfdGVzdF9tZWFuK2RlbHRhX3Rlc3Rfc2VtKSwgd2lkdGggPSAwLjEpICsKICAgIGdlb21fc21vb3RoKG1ldGhvZD0ibG0iLCBzZT1ULCBhbHBoYT0wLjUpICsKICAgIGdlb21fcG9pbnQoc3RhdD0iaWRlbnRpdHkiLCBwb3NpdGlvbj0iZG9kZ2UiLCBhbHBoYT0xLCBzaXplPTMpICsKICAgIHlsYWIobWV0cmljKSArCiAgICB4bGFiKCJMb2cgTWlsbGlvbiBUcmFpbmluZyBUb2tlbnMiKSArCiAgICBnZ3RpdGxlKCJUcmFpbmluZyBTaXplIHZzLiBQcmVkaWN0aXZlIFBvd2VyIikgKwogICAgZmFjZXRfZ3JpZChjb3JwdXN+bW9kZWwsIHNjYWxlcz0iZnJlZSIpICsKICAgICNzY2FsZV9jb2xvcl9tYW51YWwodmFsdWVzID0gYygiI0E0MkVGMSIsICIjMzg5NEM4IikpICsKICAgIHRoZW1lKGF4aXMudGV4dD1lbGVtZW50X3RleHQoc2l6ZT0xNCksCiAgICAgICAgICBzdHJpcC50ZXh0LnggPSBlbGVtZW50X3RleHQoc2l6ZT0xNCksCiAgICAgICAgICBsZWdlbmQudGV4dD1lbGVtZW50X3RleHQoc2l6ZT0xNCksCiAgICAgICAgICBheGlzLnRpdGxlPWVsZW1lbnRfdGV4dChzaXplPTE4KSwKICAgICAgICAgIGxlZ2VuZC5wb3NpdGlvbiA9ICJib3R0b20iKQojZ2dzYXZlKCIuL2NvZ3NjaV9pbWFnZXMvdHJhaW5pbmdfbG9nbGlrLnBuZyIsaGVpZ2h0PTUsd2lkdGg9NikKYGBgCgoKYGBge3IgT24gU0cgc2NvcmV9Cm1vZGVsX2RlbHRhcyAlPiUKICBtdXRhdGUodHJhaW5fc2l6ZSA9IGxvZyh0cmFpbl9zaXplKSkgJT4lCiAgZ2dwbG90KGFlcyh4PXRyYWluX3NpemUsIHk9c2dfc2NvcmUsIGNvbG9yPW1vZGVsKSkgKwogICAgZ2VvbV9zbW9vdGgobWV0aG9kPSJsbSIsIHNlPVQsIGFscGhhPTAuNSkgKwogICAgZ2VvbV9wb2ludChzdGF0PSJpZGVudGl0eSIsIHBvc2l0aW9uPSJkb2RnZSIsIGFscGhhPTEsIHNpemU9MykgKwogICAgeWxhYigiU0cgU0NvcmUiKSArCiAgICB4bGFiKCJMb2cgTWlsbGlvbiBUcmFpbmluZyBUb2tlbnMiKSArCiAgICBnZ3RpdGxlKCJUcmFpbmluZyBTaXplIHZzLiBTeW50YWN0aWMgR2VuZXJhbGl6YXRpb24iKSArCiAgICAjc2NhbGVfY29sb3JfbWFudWFsKHZhbHVlcyA9IGMoIiNBNDJFRjEiLCAiIzM4OTRDOCIpKSArCiAgICBmYWNldF9ncmlkKH5tb2RlbCwgc2NhbGVzPSJmcmVlIikgKwogICAgdGhlbWUoYXhpcy50ZXh0PWVsZW1lbnRfdGV4dChzaXplPTE0KSwKICAgICAgICAgIHN0cmlwLnRleHQueCA9IGVsZW1lbnRfdGV4dChzaXplPTE0KSwKICAgICAgICAgIGxlZ2VuZC50ZXh0PWVsZW1lbnRfdGV4dChzaXplPTE0KSwKICAgICAgICAgIGF4aXMudGl0bGU9ZWxlbWVudF90ZXh0KHNpemU9MTgpLAogICAgICAgICAgbGVnZW5kLnBvc2l0aW9uID0gImJvdHRvbSIpCiNnZ3NhdmUoIi4vY29nc2NpX2ltYWdlcy90cmFpbmlu
Z19zZy5wbmciLGhlaWdodD01LHdpZHRoPTYpCmBgYAoKIyMgU21pdGggJiBMZXZ5IHJlcHJvZHVjdGlvbgoKYGBge3J9CiAgCmFsbF9kYXRhICU+JQogIGZpbHRlcihzdXJwcmlzYWwgPCAxNSwgc3VycHJpc2FsID4gMCkgJT4lCiAgZ2dwbG90KGFlcyh4PXN1cnByaXNhbCwgeT1wc3ljaG9tZXRyaWMsIGNvbG9yPXRyYWluaW5nKSkgKwogICAgc3RhdF9zbW9vdGgoc2U9VCwgYWxwaGE9MC41KSArCiAgICAjZ2VvbV9lcnJvcmJhcihjb2xvcj0iYmxhY2siLCB3aWR0aD0uMiwgcG9zaXRpb249cG9zaXRpb25fZG9kZ2Uod2lkdGg9LjkpLCBhbHBoYT0wLjMpICsKICAgICNnZW9tX3BvaW50KHN0YXQ9ImlkZW50aXR5IiwgcG9zaXRpb249ImRvZGdlIiwgYWxwaGE9MSwgc2l6ZT0zKSArCiAgICB5bGFiKCJQcm9jZXNzaW5nIFRpbWUgKG1zKSIpICsKICAgIHhsYWIoIlN1cnByaXNhbCAoYml0cykiKSArCiAgICBnZ3RpdGxlKCJTdXJwcmlzYWwgdnMuIFJlYWRpbmcgVGltZSAvIEdhemUgRHVyYXRpb24iKSArCiAgICBmYWNldF9ncmlkKGNvcnB1c35tb2RlbCwgc2NhbGVzID0gImZyZWUiKSArCiAgICBzY2FsZV9jb2xvcl9tYW51YWwodmFsdWVzID0gYygiYmxsaXAtbGciPSIjNDQwMTU0RkYiLAogICAgICAgICAgICAgICAgICAgICAgICAgICAgICAiYmxsaXAtbWQiPSIjMzk1NjhDRkYiLAogICAgICAgICAgICAgICAgICAgICAgICAgICAgICAiYmxsaXAtc20iPSIjMUY5NjhCRkYiLAogICAgICAgICAgICAgICAgICAgICAgICAgICAgICAiYmxsaXAteHMiPSIjNzNEMDU1RkYiLAogICAgICAgICAgICAgICAgICAgICAgICAgICAgICAiYmxsaXAtbGctZ3B0YnBlIj0iIzg4ODg4OCIsCiAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICJibGxpcC1tZC1ncHRicGUiPSIjODg4ODg4IiwKICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgImJsbGlwLXNtLWdwdGJwZSI9IiM4ODg4ODgiLAogICAgICAgICAgICAgICAgICAgICAgICAgICAgICAiYmxsaXAteHMtZ3B0YnBlIj0iIzg4ODg4OCIpKSArCiAgICB0aGVtZShheGlzLnRleHQ9ZWxlbWVudF90ZXh0KHNpemU9MTQpLAogICAgICAgICAgYXhpcy50ZXh0LnkgPSBlbGVtZW50X3RleHQoc2l6ZSA9IDEwKSwKICAgICAgICAgIHN0cmlwLnRleHQueCA9IGVsZW1lbnRfdGV4dChzaXplPTE0KSwKICAgICAgICAgIGxlZ2VuZC50ZXh0PWVsZW1lbnRfdGV4dChzaXplPTE0KSwKICAgICAgICAgIGF4aXMudGl0bGU9ZWxlbWVudF90ZXh0KHNpemU9MTgpLAogICAgICAgICAgbGVnZW5kLnBvc2l0aW9uID0gInJpZ2h0IikKZ2dzYXZlKCIuLi9pbWFnZXMvY3VueTIwMjAvc3VycF9jb3JyLnBuZyIsaGVpZ2h0PTQuNSx3aWR0aD0xMikKYGBgCg==